From 729b44082d80c733916daea5cd42a5eb600af535 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Mon, 19 Dec 2022 14:01:59 -0500 Subject: [PATCH 01/18] Add Preliminary MHD Intergrater This commit primarily adds support for MHD to the Van Leer 3D integrator along with myriad small fixes and modifications. All new features have tests as well. The MHD implementation still has bugs but needs to be merged in before we reformat the code so that the merging doesn't provoke too many merge conflicts. MHD - Add MHD support to Van Leer 3D integrator - All MHD code is in the `mhd` namespace with sub-namespaces when relevant (e.g. `mhd::utils`) - Add kernel to compute the CT electric fields and tests for it - Add kernel to update the magnetic field and tests for it - Add MHD support to the PCM reconstruction - Add new `Linear_Wave` initial condition type - Add `ctElectricFields` global device array - Set all MHD input parameters to default to zero - Remove incorrect MHD specializations in the boundary conditions - Add check to make sure MHD has at least 3 ghost cells - Add functions to compute the maximum magnetic divergence, report it, and exit if it's too large - Clean up make.type.mhd and enable cuda error checking - Add example parameter files for - Alfven wave - Fast magnetosonic wave - Slow magnetosonic wave - Ryu & Jones 1995 shock tubes 1a and 2a - Add the following input parameters for generalized linear waves - EigenVec_rho - EigenVec_MomentumX - EigenVec_MomentumY - EigenVec_MomentumZ - EigenVec_E - EigenVec_Bx - EigenVec_By - EigenVec_Bz - pitch - yaw - Added MHD system tests for: - Hydro only constant state test - MHD constant state - Sod test that works with PCM (this will be merged with the hydro test when MHD supports PPMC) - All 4 MHD linear waves - MHD Einfeldt strong rarefaction Testing - Add new method, `runL1ErrorTest`, to `SystemTestRunner` that computes the L1 error compared to the initial conditions. 
Ideal for wave tests - Updated hydro wave tests to use new `runL1ErrorTest` method HLLD Riemann Solver - Updated interface state indexing for new format - Added documentation - Moved dot product function to `math_utils` Reductions - Add new FP atomic max that works on CUDA or ROCm - Update time step calculation to use the grid reduction with atomic and DeviceVector - Updated tests to match - Remove dev_dti, host_dti_array, and dev_dti_array global variables Utilities Cuda Utilities - Add function `initGpuMemory` which initializes GPU memory so the CUDA compute sanitizer doesn't complain about it. Used to initialize all GPU arrays that I know of. - Add struct `AutomaticLaunchParams` which is a thin wrapper over the occupancy API. Primarily intended for reductions where performance is sensitive to the number of blocks but could be used for any kernel launch DeviceVector - New option to initialize memory Math Utilities New namespace and file for math utilities. Currently contains a semi-general rotation and dot product functions MHD Utilities - The `mhd::utils::computeEnergy` function now works properly with either MHD or hydro and returns the appropriate energy Other - Add a function `to_string_exact` to convert floating point numbers to a string such that it can be exactly deserialized back from a string to the same floating point number. 
Used in tests currently --- .gitmodules | 3 + Makefile | 6 +- builds/make.host.c3po | 6 +- builds/make.host.spock | 1 + builds/make.type.mhd | 21 +- cholla-tests-data | 2 +- examples/1D/sound_wave.txt | 7 +- examples/2D/sound_wave.txt | 7 +- examples/3D/Brio_and_Wu.txt | 6 +- examples/3D/Ryu_and_Jones_1a.txt | 74 ++ examples/3D/Ryu_and_Jones_2a.txt | 74 ++ examples/3D/alfven_wave.txt | 71 ++ examples/3D/constant.txt | 6 +- examples/3D/fast_magnetosonic.txt | 71 ++ examples/3D/mhd_contact_wave.txt | 71 ++ examples/3D/slow_magnetosonic.txt | 72 ++ examples/3D/sound_wave.txt | 7 +- src/global/global.cpp | 20 + src/global/global.h | 20 +- src/global/global_cuda.cu | 6 +- src/global/global_cuda.h | 12 +- src/grid/boundary_conditions.cpp | 6 +- src/grid/cuda_boundaries.cu | 85 +-- src/grid/grid3D.cpp | 78 ++- src/grid/grid3D.h | 64 +- src/grid/initial_conditions.cpp | 127 ++-- src/hydro/hydro_cuda.cu | 94 ++- src/hydro/hydro_cuda_tests.cu | 36 +- src/integrators/VL_3D_cuda.cu | 162 +++-- src/io/io.h | 19 + src/main.cpp | 17 +- src/mhd/ct_electric_fields.cu | 340 ++++++++++ src/mhd/ct_electric_fields.h | 155 +++++ src/mhd/ct_electric_fields_tests.cu | 207 ++++++ src/mhd/magnetic_divergence.cu | 112 +++ src/mhd/magnetic_divergence.h | 81 +++ src/mhd/magnetic_divergence_tests.cu | 59 ++ src/mhd/magnetic_update.cu | 80 +++ src/mhd/magnetic_update.h | 57 ++ src/mhd/magnetic_update_tests.cu | 150 +++++ src/reconstruction/pcm_cuda.cu | 378 +++++------ src/reconstruction/plmc_cuda.cu | 84 +-- src/reconstruction/plmp_cuda.cu | 46 +- src/reconstruction/ppmc_cuda.cu | 122 ++-- src/reconstruction/ppmp_cuda.cu | 80 +-- src/riemann_solvers/hlld_cuda.cu | 160 ++--- src/riemann_solvers/hlld_cuda.h | 63 +- src/riemann_solvers/hlld_cuda_tests.cu | 260 +++---- src/system_tests/hydro_system_tests.cpp | 221 +++++- .../input_files/blank_settings_file.txt | 3 + ...stant_CorrectInputExpectCorrectOutput.txt} | 0 ...ave3D_CorrectInputExpectCorrectOutput.txt} | 21 +- 
...icFieldCorrectInputExpectCorrectOutput.txt | 50 ++ ...icFieldCorrectInputExpectCorrectOutput.txt | 50 ++ ...action_CorrectInputExpectCorrectOutput.txt | 71 ++ ...zedMpi_CorrectInputExpectCorrectOutput.txt | 57 ++ src/system_tests/mhd_system_tests.cpp | 636 ++++++++++++++++++ src/system_tests/system_tester.cpp | 209 +++++- src/system_tests/system_tester.h | 32 +- src/utils/DeviceVector.h | 22 +- src/utils/DeviceVector_tests.cu | 7 +- src/utils/cuda_utilities.h | 75 ++- src/utils/cuda_utilities_tests.cpp | 20 - src/utils/gpu.hpp | 10 +- src/utils/hydro_utilities.h | 34 + src/utils/hydro_utilities_tests.cpp | 42 ++ src/utils/math_utilities.h | 92 +++ src/utils/math_utilities_tests.cpp | 64 ++ src/utils/mhd_utilities.cpp | 18 - src/utils/mhd_utilities.cu | 25 + src/utils/mhd_utilities.h | 97 ++- ...ities_tests.cpp => mhd_utilities_tests.cu} | 120 ++-- src/utils/reduction_utilities.cu | 14 - src/utils/reduction_utilities.h | 191 ++++-- src/utils/reduction_utilities_tests.cu | 44 +- src/utils/testing_utilities.cpp | 88 +-- src/utils/testing_utilities.h | 63 +- 77 files changed, 4765 insertions(+), 1296 deletions(-) create mode 100644 examples/3D/Ryu_and_Jones_1a.txt create mode 100644 examples/3D/Ryu_and_Jones_2a.txt create mode 100644 examples/3D/alfven_wave.txt create mode 100644 examples/3D/fast_magnetosonic.txt create mode 100644 examples/3D/mhd_contact_wave.txt create mode 100644 examples/3D/slow_magnetosonic.txt create mode 100644 src/mhd/ct_electric_fields.cu create mode 100644 src/mhd/ct_electric_fields.h create mode 100644 src/mhd/ct_electric_fields_tests.cu create mode 100644 src/mhd/magnetic_divergence.cu create mode 100644 src/mhd/magnetic_divergence.h create mode 100644 src/mhd/magnetic_divergence_tests.cu create mode 100644 src/mhd/magnetic_update.cu create mode 100644 src/mhd/magnetic_update.h create mode 100644 src/mhd/magnetic_update_tests.cu create mode 100644 src/system_tests/input_files/blank_settings_file.txt rename 
src/system_tests/input_files/{tHYDROSYSTEMConstant_CorrectInputExpectCorrectOutput.txt => tHYDROtMHDSYSTEMConstant_CorrectInputExpectCorrectOutput.txt} (100%) rename src/system_tests/input_files/{tHYDROSYSTEMSoundWave3D_CorrectInputExpectCorrectOutput.txt => tHYDROtMHDSYSTEMSoundWave3D_CorrectInputExpectCorrectOutput.txt} (70%) create mode 100644 src/system_tests/input_files/tMHDSYSTEMConstantParameterizedMpi_MagneticFieldCorrectInputExpectCorrectOutput.txt create mode 100644 src/system_tests/input_files/tMHDSYSTEMConstantParameterizedMpi_ZeroMagneticFieldCorrectInputExpectCorrectOutput.txt create mode 100644 src/system_tests/input_files/tMHDSYSTEMEinfeldtStrongRarefaction_CorrectInputExpectCorrectOutput.txt create mode 100644 src/system_tests/input_files/tMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput.txt create mode 100644 src/system_tests/mhd_system_tests.cpp create mode 100644 src/utils/math_utilities.h create mode 100644 src/utils/math_utilities_tests.cpp delete mode 100644 src/utils/mhd_utilities.cpp create mode 100644 src/utils/mhd_utilities.cu rename src/utils/{mhd_utilities_tests.cpp => mhd_utilities_tests.cu} (81%) diff --git a/.gitmodules b/.gitmodules index e69de29bb..c9a26c699 100644 --- a/.gitmodules +++ b/.gitmodules @@ -0,0 +1,3 @@ +[submodule "cholla-tests-data"] + path = cholla-tests-data + url = https://github.com/cholla-hydro/cholla-tests-data.git diff --git a/Makefile b/Makefile index dd1915537..dcc6d296c 100644 --- a/Makefile +++ b/Makefile @@ -10,7 +10,7 @@ CUDA_ARCH ?= sm_70 DIRS := src src/analysis src/chemistry_gpu src/cooling src/cooling_grackle src/cosmology \ src/cpu src/global src/gravity src/gravity/paris src/grid src/hydro \ - src/integrators src/io src/main.cpp src/main_tests.cpp \ + src/integrators src/io src/main.cpp src/main_tests.cpp src/mhd\ src/model src/mpi src/old_cholla src/particles src/reconstruction \ src/riemann_solvers src/system_tests src/utils src/dust @@ -38,6 +38,9 @@ ifeq ($(TEST), true) 
CFLAGS += $(TEST_FLAGS) CXXFLAGS += $(TEST_FLAGS) GPUFLAGS += $(TEST_FLAGS) + CFLAGS += $(TEST_FLAGS) + CXXFLAGS += $(TEST_FLAGS) + GPUFLAGS += $(TEST_FLAGS) # HACK # Set the build flags to debug. This is mostly to avoid the approximations @@ -134,6 +137,7 @@ ifdef HIPCONFIG DFLAGS += -DO_HIP CXXFLAGS += $(HIPCONFIG) GPUCXX ?= hipcc + GPUFLAGS += -Wall -ferror-limit=1 LD := $(CXX) LDFLAGS := $(CXXFLAGS) -L$(ROCM_PATH)/lib LIBS += -lamdhip64 diff --git a/builds/make.host.c3po b/builds/make.host.c3po index 79574201c..02f658896 100644 --- a/builds/make.host.c3po +++ b/builds/make.host.c3po @@ -3,13 +3,9 @@ CC = mpicc CXX = mpicxx CFLAGS_DEBUG = -g -O0 CFLAGS_OPTIMIZE = -g -O2 -CXXFLAGS_DEBUG = -g -O0 -std=c++11 ${F_OFFLOAD} -CXXFLAGS_OPTIMIZE = -g -Ofast -std=c++11 ${F_OFFLOAD} -GPUFLAGS_DEBUG = -g -O0 -std=c++11 -ccbin=mpicxx -GPUFLAGS_OPTIMIZE = -g -O3 -std=c++11 -ccbin=mpicxx CXXFLAGS_DEBUG = -g -O0 -std=c++17 ${F_OFFLOAD} CXXFLAGS_OPTIMIZE = -g -Ofast -std=c++17 ${F_OFFLOAD} -GPUFLAGS_DEBUG = -g -G -cudart shared -O0 -std=c++17 -ccbin=mpicxx +GPUFLAGS_DEBUG = -g -G -cudart shared -O0 -std=c++17 -ccbin=mpicxx -Xcompiler -rdynamic GPUFLAGS_OPTIMIZE = -g -O3 -std=c++17 -ccbin=mpicxx OMP_NUM_THREADS = 7 diff --git a/builds/make.host.spock b/builds/make.host.spock index b839e95ae..8cac7c086 100644 --- a/builds/make.host.spock +++ b/builds/make.host.spock @@ -6,6 +6,7 @@ CXX = CC CFLAGS_DEBUG = -g -O0 CFLAGS_OPTIMIZE = -g -O2 + CXXFLAGS_DEBUG = -g -O0 -std=c++17 CXXFLAGS_OPTIMIZE = -g -Ofast -std=c++17 diff --git a/builds/make.type.mhd b/builds/make.type.mhd index 3f67ea88f..486ba2547 100644 --- a/builds/make.type.mhd +++ b/builds/make.type.mhd @@ -9,15 +9,14 @@ MPI_GPU ?= DFLAGS += -DCUDA DFLAGS += -DMPI_CHOLLA DFLAGS += -DPRECISION=2 -DFLAGS += -DPPMP +# Currently MHD only supports PCM reconstruction. 
Higher order reconstruction +# methods will be added later +DFLAGS += -DPCM DFLAGS += -DHLLD DFLAGS += -DMHD -ifeq ($(findstring cosmology,$(TYPE)),cosmology) -DFLAGS += -DSIMPLE -else +# MHD only supports the Van Leer integrator DFLAGS += -DVL -endif # need this if using Disk_3D # DFLAGS += -DDISK_ICS @@ -45,3 +44,15 @@ DFLAGS += $(OUTPUT) #If not specified, MPI_GPU is off by default #This is set in the system make.host file DFLAGS += $(MPI_GPU) + +# NOTE: The following macros are to help facilitate debugging and should not be +# used on scientific runs + +# Do CUDA error checking +DFLAGS += -DCUDA_ERROR_CHECK + +# Limit the number of steps to evolve. +# DFLAGS += -DN_STEPS_LIMIT=1000 + +# Output on every time step +# DFLAGS += -DOUTPUT_ALWAYS diff --git a/cholla-tests-data b/cholla-tests-data index 66d592821..c069bb7a6 160000 --- a/cholla-tests-data +++ b/cholla-tests-data @@ -1 +1 @@ -Subproject commit 66d5928213b495c2fef61b0653b90a25ae3aa7cf +Subproject commit c069bb7a6de79546f60d3ea47f6c10ba19df3c76 diff --git a/examples/1D/sound_wave.txt b/examples/1D/sound_wave.txt index c6555c662..97b7c92b1 100644 --- a/examples/1D/sound_wave.txt +++ b/examples/1D/sound_wave.txt @@ -30,18 +30,17 @@ outdir=./ ################################################# # Parameters for linear wave problems -# initial density +# initial density rho=1.0 -# velocity in the x direction +# velocity in the x direction vx=0 # velocity in the y direction vy=0 # velocity in the z direction vz=0 -# initial pressure +# initial pressure P=0.6 # amplitude of perturbing oscillations A=1e-4 # value of gamma gamma=1.666666666666667 - diff --git a/examples/2D/sound_wave.txt b/examples/2D/sound_wave.txt index d69b1270f..58608bac2 100644 --- a/examples/2D/sound_wave.txt +++ b/examples/2D/sound_wave.txt @@ -33,18 +33,17 @@ outdir=./ ################################################# # Parameters for linear wave problems -# initial density +# initial density rho=1.0 -# velocity in the x direction +# 
velocity in the x direction vx=0 # velocity in the y direction vy=0 # velocity in the z direction vz=0 -# initial pressure +# initial pressure P=0.6 # amplitude of perturbing oscillations A=1e-4 # value of gamma gamma=1.666666666666667 - diff --git a/examples/3D/Brio_and_Wu.txt b/examples/3D/Brio_and_Wu.txt index a742ae207..fba126396 100644 --- a/examples/3D/Brio_and_Wu.txt +++ b/examples/3D/Brio_and_Wu.txt @@ -6,11 +6,11 @@ ################################################ # number of grid cells in the x dimension -nx=32 +nx=256 # number of grid cells in the y dimension -ny=32 +ny=256 # number of grid cells in the z dimension -nz=32 +nz=256 # final output time tout=0.1 # time interval for output diff --git a/examples/3D/Ryu_and_Jones_1a.txt b/examples/3D/Ryu_and_Jones_1a.txt new file mode 100644 index 000000000..168fcdffa --- /dev/null +++ b/examples/3D/Ryu_and_Jones_1a.txt @@ -0,0 +1,74 @@ +# +# Parameter File for 3D Ryu & Jones MHD shock tube 4d. +# Citation: Ryu & Jones 1995 "Numerical Magnetohydrodynamics in Astrophysics: +# Algorithms and Tests for One-Dimensional Flow" +# +# Note: There are many shock tubes in this paper. 
This settings file is +# specifically for shock tube 4d +# + +################################################ +# number of grid cells in the x dimension +nx=32 +# number of grid cells in the y dimension +ny=32 +# number of grid cells in the z dimension +nz=32 +# final output time +tout=0.08 +# time interval for output +outstep=0.08 +# name of initial conditions +init=Riemann + +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 +ylen=1.0 +zlen=1.0 + +# type of boundary conditions +xl_bcnd=3 +xu_bcnd=3 +yl_bcnd=3 +yu_bcnd=3 +zl_bcnd=3 +zu_bcnd=3 + +# path to output directory +outdir=./ + +################################################# +# Parameters for 1D Riemann problems +# density of left state +rho_l=1.0 +# velocity of left state +vx_l=10.0 +vy_l=0.0 +vz_l=0.0 +# pressure of left state +P_l=20.0 +# Magnetic field of the left state +Bx_l=1.4104739588693909 +By_l=1.4104739588693909 +Bz_l=0.0 + +# density of right state +rho_r=1.0 +# velocity of right state +vx_r=-10.0 +vy_r=0.0 +vz_r=0.0 +# pressure of right state +P_r=1.0 +# Magnetic field of the right state +Bx_r=1.4104739588693909 +By_r=1.4104739588693909 +Bz_r=0.0 + +# location of initial discontinuity +diaph=0.5 +# value of gamma +gamma=1.6666666666666667 diff --git a/examples/3D/Ryu_and_Jones_2a.txt b/examples/3D/Ryu_and_Jones_2a.txt new file mode 100644 index 000000000..f886b4de3 --- /dev/null +++ b/examples/3D/Ryu_and_Jones_2a.txt @@ -0,0 +1,74 @@ +# +# Parameter File for 3D Ryu & Jones MHD shock tube 4d. +# Citation: Ryu & Jones 1995 "Numerical Magnetohydrodynamics in Astrophysics: +# Algorithms and Tests for One-Dimensional Flow" +# +# Note: There are many shock tubes in this paper. 
This settings file is +# specifically for shock tube 4d +# + +################################################ +# number of grid cells in the x dimension +nx=32 +# number of grid cells in the y dimension +ny=32 +# number of grid cells in the z dimension +nz=32 +# final output time +tout=0.2 +# time interval for output +outstep=0.2 +# name of initial conditions +init=Riemann + +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 +ylen=1.0 +zlen=1.0 + +# type of boundary conditions +xl_bcnd=3 +xu_bcnd=3 +yl_bcnd=3 +yu_bcnd=3 +zl_bcnd=3 +zu_bcnd=3 + +# path to output directory +outdir=./ + +################################################# +# Parameters for 1D Riemann problems +# density of left state +rho_l=1.08 +# velocity of left state +vx_l=1.2 +vy_l=0.01 +vz_l=0.5 +# pressure of left state +P_l=0.95 +# Magnetic field of the left state +Bx_l=7.0898154036220635 +By_l=1.0155412503859613 +Bz_l=0.5641895835477563 + +# density of right state +rho_r=1.0 +# velocity of right state +vx_r=0.0 +vy_r=0.0 +vz_r=0.0 +# pressure of right state +P_r=1.0 +# Magnetic field of the right state +Bx_r=7.0898154036220635 +By_r=1.1283791670955126 +Bz_r=0.5641895835477563 + +# location of initial discontinuity +diaph=0.5 +# value of gamma +gamma=1.6666666666666667 diff --git a/examples/3D/alfven_wave.txt b/examples/3D/alfven_wave.txt new file mode 100644 index 000000000..bfacbc968 --- /dev/null +++ b/examples/3D/alfven_wave.txt @@ -0,0 +1,71 @@ +# +# Parameter File for MHD Alfven Wave +# See [this blog post](https://robertcaddy.com/posts/Classes-and-bugfixing-6/) +# for details on each wave +# The right eigenvector for this wave is: +# (1/3) * [0, 0, +/-1, -/+2*sqrt(2), 0, -1, 2*sqrt(2), 0] +# The terms with two sign options: use the left one for right moving waves and +# the right one for left moving waves +# + +################################################ +# number of grid cells in the x dimension +nx=256 +# number of grid cells in the y dimension +ny=256 +# number of grid 
cells in the z dimension +nz=256 +# final output time +tout=1.0 +# time interval for output +outstep=1.0 +# name of initial conditions +init=Linear_Wave +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 +ylen=1.0 +zlen=1.0 +# type of boundary conditions +xl_bcnd=1 +xu_bcnd=1 +yl_bcnd=1 +yu_bcnd=1 +zl_bcnd=1 +zu_bcnd=1 +# path to output directory +outdir=./ + +################################################# +# Parameters for linear wave problems +# initial density +rho=1.0 +# velocity in the x direction +vx=0 +# velocity in the y direction +vy=0 +# velocity in the z direction +vz=0 +# initial pressure +P=0.6 +# magnetic field in the x direction +Bx=1 +# magnetic field in the y direction +By=1.5 +# magnetic field in the z direction +Bz=0 +# amplitude of perturbing oscillations +A=1e-6 +# value of gamma +gamma=1.666666666666667 +# The right eigenvectors to set the wave properly +rEigenVec_rho=0 +rEigenVec_MomentumX=0 +rEigenVec_MomentumY=0 +rEigenVec_MomentumZ=-1 +rEigenVec_Bx=0 +rEigenVec_By=0 +rEigenVec_Bz=1 +rEigenVec_E=0 diff --git a/examples/3D/constant.txt b/examples/3D/constant.txt index ca3b411e2..871fbb7b7 100644 --- a/examples/3D/constant.txt +++ b/examples/3D/constant.txt @@ -42,9 +42,9 @@ vz=0 # pressure P=1.380658e-5 # Magnetic Field -Bx=0.0 -By=0.0 -Bz=0.0 +Bx=1.0e-5 +By=2.0e-5 +Bz=3.0e-5 # value of gamma gamma=1.666666667 diff --git a/examples/3D/fast_magnetosonic.txt b/examples/3D/fast_magnetosonic.txt new file mode 100644 index 000000000..bc134a79a --- /dev/null +++ b/examples/3D/fast_magnetosonic.txt @@ -0,0 +1,71 @@ +# +# Parameter File for MHD fast magnetosonic wave +# See [this blog post](https://robertcaddy.com/posts/Classes-and-bugfixing-6/) +# for details on each wave. 
+# The right eigenvector for this wave is: +# (1/(6*sqrt(5))) * [6, +/-12, -/+4*sqrt(2), -/+2, 0, 8*sqrt(2), 4, 27] +# The terms with two sign options: use the left one for right moving waves and +# the right one for left moving waves +# + +################################################ +# number of grid cells in the x dimension +nx=256 +# number of grid cells in the y dimension +ny=256 +# number of grid cells in the z dimension +nz=256 +# final output time +tout=0.5 +# time interval for output +outstep=0.5 +# name of initial conditions +init=Linear_Wave +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 +ylen=1.0 +zlen=1.0 +# type of boundary conditions +xl_bcnd=1 +xu_bcnd=1 +yl_bcnd=1 +yu_bcnd=1 +zl_bcnd=1 +zu_bcnd=1 +# path to output directory +outdir=./ + +################################################# +# Parameters for linear wave problems +# initial density +rho=1.0 +# velocity in the x direction +vx=0 +# velocity in the y direction +vy=0 +# velocity in the z direction +vz=0 +# initial pressure +P=0.6 +# magnetic field in the x direction +Bx=1 +# magnetic field in the y direction +By=1.5 +# magnetic field in the z direction +Bz=0 +# amplitude of perturbing oscillations +A=1e-6 +# value of gamma +gamma=1.666666666666667 +# The right eigenvectors to set the wave properly +rEigenVec_rho=0.4472135954999579 +rEigenVec_MomentumX=0.8944271909999159 +rEigenVec_MomentumY=-0.4472135954999579 +rEigenVec_MomentumZ=0.0 +rEigenVec_Bx=0.0 +rEigenVec_By=0.8944271909999159 +rEigenVec_Bz=0.0 +rEigenVec_E=2.0124611797498106 diff --git a/examples/3D/mhd_contact_wave.txt b/examples/3D/mhd_contact_wave.txt new file mode 100644 index 000000000..9250bba5a --- /dev/null +++ b/examples/3D/mhd_contact_wave.txt @@ -0,0 +1,71 @@ +# +# Parameter File for MHD contact wave +# See [this blog post](https://robertcaddy.com/posts/Classes-and-bugfixing-6/) +# for details on each wave +# The right eigenvector for this wave is: +# (1/2) * [2, +/-2, 0, 0, 0, 0, 0, 1] +# The terms 
with two sign options: use the left one for right moving waves and +# the right one for left moving waves +# + +################################################ +# number of grid cells in the x dimension +nx=256 +# number of grid cells in the y dimension +ny=256 +# number of grid cells in the z dimension +nz=256 +# final output time +tout=1.0 +# time interval for output +outstep=1.0 +# name of initial conditions +init=Linear_Wave +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 +ylen=1.0 +zlen=1.0 +# type of boundary conditions +xl_bcnd=1 +xu_bcnd=1 +yl_bcnd=1 +yu_bcnd=1 +zl_bcnd=1 +zu_bcnd=1 +# path to output directory +outdir=./ + +################################################# +# Parameters for linear wave problems +# initial density +rho=1.0 +# velocity in the x direction +vx=1 +# velocity in the y direction +vy=0 +# velocity in the z direction +vz=0 +# initial pressure +P=0.6 +# magnetic field in the x direction +Bx=1 +# magnetic field in the y direction +By=1.5 +# magnetic field in the z direction +Bz=0 +# amplitude of perturbing oscillations +A=1e-1 +# value of gamma +gamma=1.666666666666667 +# The right eigenvectors to set the wave properly +rEigenVec_rho=1.0 +rEigenVec_MomentumX=1.0 +rEigenVec_MomentumY=0.0 +rEigenVec_MomentumZ=0.0 +rEigenVec_Bx=0.0 +rEigenVec_By=0.0 +rEigenVec_Bz=0.0 +rEigenVec_E=0.5 diff --git a/examples/3D/slow_magnetosonic.txt b/examples/3D/slow_magnetosonic.txt new file mode 100644 index 000000000..960952b5f --- /dev/null +++ b/examples/3D/slow_magnetosonic.txt @@ -0,0 +1,72 @@ +# +# Parameter File for MHD slow magnetosonic wave +# See [this blog post](https://robertcaddy.com/posts/Classes-and-bugfixing-6/) +# for details on each wave +# The right eigenvector for this wave is: +# (1/(6*sqrt(5))) * [12, +/-6, +/-8*sqrt(2), +/-4, 0, -4*sqrt(2), -2, 9] +# The terms with two sign options: use the left one for right moving waves and +# the right one for left moving waves +# + +################################################ 
+# number of grid cells in the x dimension +nx=256 +# number of grid cells in the y dimension +ny=256 +# number of grid cells in the z dimension +nz=256 +# final output time +tout=2.0 +# time interval for output +outstep=2.0 +# name of initial conditions +init=Linear_Wave +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 +ylen=1.0 +zlen=1.0 +# type of boundary conditions +xl_bcnd=1 +xu_bcnd=1 +yl_bcnd=1 +yu_bcnd=1 +zl_bcnd=1 +zu_bcnd=1 +# path to output directory +outdir=./ + +################################################# +# Parameters for linear wave problems +# initial density +rho=1.0 +# velocity in the x direction +vx=0 +# velocity in the y direction +vy=0 +# velocity in the z direction +vz=0 +# initial pressure +P=0.6 +# magnetic field in the x direction +Bx=1 +# magnetic field in the y direction +By=1.5 +# magnetic field in the z direction +Bz=0 +# amplitude of perturbing oscillations +A=1e-6 +# value of gamma +gamma=1.666666666666667 +# The right eigenvectors to set the wave properly +rEigenVec_rho=0.8944271909999159 +rEigenVec_MomentumX=0.4472135954999579 +rEigenVec_MomentumY=0.8944271909999159 +rEigenVec_MomentumZ=0.0 +rEigenVec_Bx=0.0 +rEigenVec_By=-0.4472135954999579 +rEigenVec_Bz=0.0 +rEigenVec_E=0.6708203932499369 + diff --git a/examples/3D/sound_wave.txt b/examples/3D/sound_wave.txt index 0f3866226..6c226c0ab 100644 --- a/examples/3D/sound_wave.txt +++ b/examples/3D/sound_wave.txt @@ -34,18 +34,17 @@ outdir=./ ################################################# # Parameters for linear wave problems -# initial density +# initial density rho=1.0 -# velocity in the x direction +# velocity in the x direction vx=0 # velocity in the y direction vy=0 # velocity in the z direction vz=0 -# initial pressure +# initial pressure P=0.6 # amplitude of perturbing oscillations A=1e-4 # value of gamma gamma=1.666666666666667 - diff --git a/src/global/global.cpp b/src/global/global.cpp index 1f6a5cbfa..ab384144b 100644 --- a/src/global/global.cpp +++ 
b/src/global/global.cpp @@ -329,6 +329,26 @@ void parse_param(char *name,char *value, struct parameters *parms){ parms->Bz_r = atof(value); else if (strcmp(name, "diaph")==0) parms->diaph = atof(value); + else if (strcmp(name, "rEigenVec_rho")==0) + parms->rEigenVec_rho = atof(value); + else if (strcmp(name, "rEigenVec_MomentumX")==0) + parms->rEigenVec_MomentumX = atof(value); + else if (strcmp(name, "rEigenVec_MomentumY")==0) + parms->rEigenVec_MomentumY = atof(value); + else if (strcmp(name, "rEigenVec_MomentumZ")==0) + parms->rEigenVec_MomentumZ = atof(value); + else if (strcmp(name, "rEigenVec_E")==0) + parms->rEigenVec_E = atof(value); + else if (strcmp(name, "rEigenVec_Bx")==0) + parms->rEigenVec_Bx = atof(value); + else if (strcmp(name, "rEigenVec_By")==0) + parms->rEigenVec_By = atof(value); + else if (strcmp(name, "rEigenVec_Bz")==0) + parms->rEigenVec_Bz = atof(value); + else if (strcmp(name, "pitch")==0) + parms->pitch = atof(value); + else if (strcmp(name, "yaw")==0) + parms->yaw = atof(value); #ifdef PARTICLES else if (strcmp(name, "prng_seed")==0) parms->prng_seed = atoi(value); diff --git a/src/global/global.h b/src/global/global.h index 79d3dbc88..50f0acf03 100644 --- a/src/global/global.h +++ b/src/global/global.h @@ -42,7 +42,7 @@ typedef double Real; #define MSUN_CGS 1.98847e33; //Msun in gr #define KPC_CGS 3.086e21; //kpc in cm #define KM_CGS 1e5; //km in cm -#define MH 1.67262171e-24 //Mass of hydrogen [g] +#define MH 1.67262171e-24 //Mass of hydrogen [g] #define TIME_UNIT 3.15569e10 // 1 kyr in s #define LENGTH_UNIT 3.08567758e21 // 1 kpc in cm @@ -235,9 +235,9 @@ struct parameters Real vz; Real P; Real A; - Real Bx; - Real By; - Real Bz; + Real Bx=0; + Real By=0; + Real Bz=0; Real rho_l; Real vx_l; Real vy_l=0; @@ -255,6 +255,16 @@ struct parameters Real By_r; Real Bz_r; Real diaph; + Real rEigenVec_rho = 0; + Real rEigenVec_MomentumX = 0; + Real rEigenVec_MomentumY = 0; + Real rEigenVec_MomentumZ = 0; + Real rEigenVec_E = 0; + Real 
rEigenVec_Bx = 0; + Real rEigenVec_By = 0; + Real rEigenVec_Bz = 0; + Real pitch = 0; + Real yaw = 0; #ifdef PARTICLES // The random seed for particle simulations. With the default of 0 then a // machine dependent seed will be generated. @@ -294,7 +304,7 @@ struct parameters int bc_potential_type; #if defined(COOLING_GRACKLE) || defined (CHEMISTRY_GPU) char UVB_rates_file[MAXLEN]; //File for the UVB photoheating and photoionization rates of HI, HeI and HeII -#endif +#endif #ifdef ANALYSIS char analysis_scale_outputs_file[MAXLEN]; //File for the scale_factor output values for cosmological simulations {{}} char analysisdir[MAXLEN]; diff --git a/src/global/global_cuda.cu b/src/global/global_cuda.cu index bd2e235c1..2153b1615 100644 --- a/src/global/global_cuda.cu +++ b/src/global/global_cuda.cu @@ -9,16 +9,12 @@ bool memory_allocated; Real *dev_conserved, *dev_conserved_half; Real *Q_Lx, *Q_Rx, *Q_Ly, *Q_Ry, *Q_Lz, *Q_Rz, *F_x, *F_y, *F_z; +Real *ctElectricFields; Real *eta_x, *eta_y, *eta_z, *etah_x, *etah_y, *etah_z; -Real *dev_dti; //Arrays for potential in GPU: Will be set to NULL if not using GRAVITY Real *dev_grav_potential; Real *temp_potential; Real *buffer_potential; -// Arrays for calc_dt -Real *host_dti_array; -Real *dev_dti_array; - #endif //CUDA diff --git a/src/global/global_cuda.h b/src/global/global_cuda.h index 9150647c0..61cbc0752 100644 --- a/src/global/global_cuda.h +++ b/src/global/global_cuda.h @@ -25,14 +25,12 @@ extern bool memory_allocated; // Flag becomes true after allocating the memory o // conserved variables extern Real *dev_conserved, *dev_conserved_half; // input states and associated interface fluxes (Q* and F* from Stone, 2008) +// Note that for hydro the size of these arrays is n_fields*n_cells*sizeof(Real) +// while for MHD it is (n_fields-1)*n_cells*sizeof(Real), i.e. 
they has one +// fewer field than you would expect extern Real *Q_Lx, *Q_Rx, *Q_Ly, *Q_Ry, *Q_Lz, *Q_Rz, *F_x, *F_y, *F_z; - -// Scalar for storing device side hydro/MHD time steps -extern Real *dev_dti; - -// array of inverse timesteps for dt calculation (brought back by Alwin May 24 2022) -extern Real *host_dti_array; -extern Real *dev_dti_array; +// Constrained transport electric fields +extern Real *ctElectricFields; //Arrays for potential in GPU: Will be set to NULL if not using GRAVITY extern Real *dev_grav_potential; diff --git a/src/grid/boundary_conditions.cpp b/src/grid/boundary_conditions.cpp index aab040ede..afe0e0a42 100644 --- a/src/grid/boundary_conditions.cpp +++ b/src/grid/boundary_conditions.cpp @@ -38,14 +38,14 @@ void Grid3D::Set_Boundary_Conditions_Grid( parameters P){ #ifdef GRAVITY #ifdef CPU_TIME Timer.Pot_Boundaries.Start(); - #endif + #endif //CPU_TIME Grav.TRANSFER_POTENTIAL_BOUNDARIES = true; Set_Boundary_Conditions(P); Grav.TRANSFER_POTENTIAL_BOUNDARIES = false; #ifdef CPU_TIME Timer.Pot_Boundaries.End(); - #endif - #endif + #endif //CPU_TIME + #endif //GRAVITY } /*! 
\fn void Set_Boundary_Conditions(parameters P) diff --git a/src/grid/cuda_boundaries.cu b/src/grid/cuda_boundaries.cu index f69ac3c59..8b689601e 100644 --- a/src/grid/cuda_boundaries.cu +++ b/src/grid/cuda_boundaries.cu @@ -3,9 +3,9 @@ #include "../global/global_cuda.h" #include "cuda_boundaries.h" -__device__ int FindIndex(int ig, int nx, int flag, int face, int n_ghost, Real *a, int &idMag); +__device__ int FindIndex(int ig, int nx, int flag, int face, int n_ghost, Real *a); -__device__ int SetBoundaryMapping(int ig, int jg, int kg, Real *a, int flags[],int nx, int ny, int nz, int n_ghost, int &magneticIdx); +__device__ int SetBoundaryMapping(int ig, int jg, int kg, Real *a, int flags[],int nx, int ny, int nz, int n_ghost); __global__ void PackBuffers3DKernel(Real * buffer, Real * c_head, int isize, int jsize, int ksize, int nx, int ny, int idxoffset, int buffer_ncells, int n_fields, int n_cells) { @@ -66,7 +66,7 @@ __global__ void SetGhostCellsKernel(Real * c_head, int f0, int f1, int f2, int f3, int f4, int f5, int isize, int jsize, int ksize, int imin, int jmin, int kmin, int dir){ - int id,i,j,k,gidx,idx,ii, magneticIdx; + int id,i,j,k,gidx,idx,ii; Real a[3] = {1.,1.,1.}; int flags[6] = {f0,f1,f2,f3,f4,f5}; @@ -93,17 +93,11 @@ __global__ void SetGhostCellsKernel(Real * c_head, gidx = i + j*nx + k*nx*ny; // calculate idx (index of real cell) and a[:] for reflection - idx = SetBoundaryMapping(i,j,k,&a[0],flags,nx,ny,nz,n_ghost,magneticIdx); + idx = SetBoundaryMapping(i,j,k,&a[0],flags,nx,ny,nz,n_ghost); if (idx>=0){ for (ii=0; ii1) { // set index on -x face if (ig < n_ghost) { - ir = FindIndex(ig, nx, flags[0], 0, n_ghost, &a[0], irMag); + ir = FindIndex(ig, nx, flags[0], 0, n_ghost, &a[0]); } // set index on +x face else if (ig >= nx-n_ghost) { - ir = FindIndex(ig, nx, flags[1], 1, n_ghost, &a[0], irMag); + ir = FindIndex(ig, nx, flags[1], 1, n_ghost, &a[0]); } // set i index for multi-D problems else { ir = ig; - #ifdef MHD - irMag = ig; - #endif //MHD } // 
if custom x boundaries are needed, set index to -1 and return if (ir < 0) { - #ifdef MHD - magneticIdx = -1; - #endif //MHD return idx = -1; } // otherwise add i index to ghost cell mapping idx += ir; - #ifdef MHD - magneticIdx += irMag; - #endif //MHD } @@ -201,33 +185,24 @@ __device__ int SetBoundaryMapping(int ig, int jg, int kg, Real *a, int flags[], // set index on -y face if (jg < n_ghost) { - jr = FindIndex(jg, ny, flags[2], 0, n_ghost, &a[1], jrMag); + jr = FindIndex(jg, ny, flags[2], 0, n_ghost, &a[1]); } // set index on +y face else if (jg >= ny-n_ghost) { - jr = FindIndex(jg, ny, flags[3], 1, n_ghost, &a[1], jrMag); + jr = FindIndex(jg, ny, flags[3], 1, n_ghost, &a[1]); } // set j index for multi-D problems else { jr = jg; - #ifdef MHD - jrMag = jg; - #endif //MHD } // if custom y boundaries are needed, set index to -1 and return if (jr < 0) { - #ifdef MHD - magneticIdx = -1; - #endif //MHD return idx = -1; } // otherwise add j index to ghost cell mapping idx += nx*jr; - #ifdef MHD - magneticIdx += nx*jrMag; - #endif //MHD } @@ -236,38 +211,29 @@ __device__ int SetBoundaryMapping(int ig, int jg, int kg, Real *a, int flags[], // set index on -z face if (kg < n_ghost) { - kr = FindIndex(kg, nz, flags[4], 0, n_ghost, &a[2], krMag); + kr = FindIndex(kg, nz, flags[4], 0, n_ghost, &a[2]); } // set index on +z face else if (kg >= nz-n_ghost) { - kr = FindIndex(kg, nz, flags[5], 1, n_ghost, &a[2], krMag); + kr = FindIndex(kg, nz, flags[5], 1, n_ghost, &a[2]); } // set k index for multi-D problems else { kr = kg; - #ifdef MHD - krMag = kg; - #endif //MHD } // if custom z boundaries are needed, set index to -1 and return if (kr < 0) { - #ifdef MHD - magneticIdx = -1; - #endif //MHD return idx = -1; } // otherwise add k index to ghost cell mapping idx += nx*ny*kr; - #ifdef MHD - magneticIdx += nx*ny*krMag; - #endif //MHD } return idx; } -__device__ int FindIndex(int ig, int nx, int flag, int face, int n_ghost, Real *a, int &idMag){ +__device__ int FindIndex(int ig, 
int nx, int flag, int face, int n_ghost, Real *a){ int id; // lower face @@ -278,45 +244,27 @@ __device__ int FindIndex(int ig, int nx, int flag, int face, int n_ghost, Real * // periodic case 1: id = ig+nx-2*n_ghost; - #ifdef MHD - idMag = id; - #endif //MHD break; // reflective case 2: id = 2*n_ghost-ig-1; *(a) = -1.0; - #ifdef MHD - idMag = id - 1; - #endif //MHD break; // transmissive case 3: id = n_ghost; - #ifdef MHD - idMag = id - 1; - #endif //MHD break; // custom case 4: id = -1; - #ifdef MHD - idMag = -1; - #endif //MHD break; // MPI case 5: id = ig; - #ifdef MHD - idMag = id; - #endif //MHD break; // default is periodic default: id = ig+nx-2*n_ghost; - #ifdef MHD - idMag = id; - #endif //MHD } } // upper face @@ -349,9 +297,6 @@ __device__ int FindIndex(int ig, int nx, int flag, int face, int n_ghost, Real * default: id = ig-nx+2*n_ghost; } - #ifdef MHD - idMag = id; - #endif //MHD } return id; } diff --git a/src/grid/grid3D.cpp b/src/grid/grid3D.cpp index e100def1c..cadcb3653 100644 --- a/src/grid/grid3D.cpp +++ b/src/grid/grid3D.cpp @@ -43,6 +43,10 @@ #include "../dust/dust_cuda.h" // provides Dust_Update #endif +#ifdef MHD + #include "../mhd/magnetic_divergence.h" +#endif //MHD + /*! \fn Grid3D(void) * \brief Constructor for the Grid. */ @@ -72,6 +76,15 @@ Grid3D::Grid3D(void) H.n_ghost_potential_offset = H.n_ghost - N_GHOST_POTENTIAL; #endif + #ifdef MHD + // Set the number of ghost cells high enough for MHD + if (H.n_ghost < 3) + { + chprintf("Insufficient number of ghost cells for MHD. H.n_ghost was %i, setting to 3.\n", H.n_ghost); + H.n_ghost = 3; + } + #endif //MHD + } /*! 
\fn void Get_Position(long i, long j, long k, Real *xpos, Real *ypos, Real *zpos) @@ -139,7 +152,7 @@ void Grid3D::Initialize(struct parameters *P) // Set the CFL coefficient (a global variable) C_cfl = 0.3; - + #ifdef AVERAGE_SLOW_CELLS H.min_dt_slow = 1e-100; //Initialize the minumum dt to a tiny number #endif // AVERAGE_SLOW_CELLS @@ -296,6 +309,7 @@ void Grid3D::AllocateMemory(void) // allocate memory for the conserved variable arrays on the device CudaSafeCall( cudaMalloc((void**)&C.device, H.n_fields*H.n_cells*sizeof(Real)) ); + cuda_utilities::initGpuMemory(C.device, H.n_fields*H.n_cells*sizeof(Real)); C.d_density = C.device; C.d_momentum_x = &(C.device[H.n_cells]); C.d_momentum_y = &(C.device[2*H.n_cells]); @@ -316,14 +330,6 @@ void Grid3D::AllocateMemory(void) C.d_GasEnergy = &(C.device[(H.n_fields-1)*H.n_cells]); #endif // DE - - // arrays that hold the max_dti calculation for hydro for each thread block (pre reduction) - int ngrid = (H.n_cells + TPB - 1) / TPB; - CudaSafeCall( cudaHostAlloc(&host_dti_array, ngrid*sizeof(Real), cudaHostAllocDefault) ); - CudaSafeCall( cudaMalloc((void**)&dev_dti_array, ngrid*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&dev_dti, sizeof(Real)) ); - - #if defined( GRAVITY ) CudaSafeCall( cudaHostAlloc(&C.Grav_potential, H.n_cells*sizeof(Real), cudaHostAllocDefault) ); CudaSafeCall( cudaMalloc((void**)&C.d_Grav_potential, H.n_cells*sizeof(Real)) ); @@ -451,7 +457,7 @@ Real Grid3D::Update_Grid(void) #ifdef VL VL_Algorithm_2D_CUDA(C.device, H.nx, H.ny, x_off, y_off, H.n_ghost, H.dx, H.dy, H.xbound, H.ybound, H.dt, H.n_fields); #endif //VL - #ifdef SIMPLE + #ifdef SIMPLE Simple_Algorithm_2D_CUDA(C.device, H.nx, H.ny, x_off, y_off, H.n_ghost, H.dx, H.dy, H.xbound, H.ybound, H.dt, H.n_fields); #endif //SIMPLE #endif //CUDA @@ -493,7 +499,7 @@ Real Grid3D::Update_Grid(void) Timer.Chemistry.RecordTime( Chem.H.runtime_chemistry_step ); #endif #endif - + #ifdef AVERAGE_SLOW_CELLS //Set the min_delta_t for averaging a slow cell 
Real max_dti_slow; @@ -540,7 +546,7 @@ Real Grid3D::Update_Hydro_Grid( ){ #ifdef ONLY_PARTICLES // Don't integrate the Hydro when only solving for particles return 1e-10; - #endif + #endif //ONLY_PARTICLES Real dti; @@ -551,26 +557,26 @@ Real Grid3D::Update_Hydro_Grid( ){ #ifdef GRAVITY // Extrapolate gravitational potential for hydro step Extrapolate_Grav_Potential(); - #endif + #endif //GRAVITY dti = Update_Grid(); #ifdef CPU_TIME #ifdef CHEMISTRY_GPU Timer.Hydro.Subtract(Chem.H.runtime_chemistry_step); - //Subtract the time spent on the Chemical Update - #endif + //Subtract the time spent on the Chemical Update + #endif //CHEMISTRY_GPU Timer.Hydro.End(); #endif //CPU_TIME #ifdef COOLING_GRACKLE #ifdef CPU_TIME Timer.Cooling.Start(); - #endif + #endif //CPU_TIME Do_Cooling_Step_Grackle( ); #ifdef CPU_TIME Timer.Cooling.End(); - #endif + #endif //CPU_TIME #endif//COOLING_GRACKLE @@ -603,6 +609,39 @@ void Grid3D::Update_Time(){ } +#ifdef MHD + void Grid3D::checkMagneticDivergence(Grid3D &G, struct parameters P, int nfile) + { + // Compute the local value of the divergence + H.max_magnetic_divergence = mhd::launchCalculateMagneticDivergence(C.device, H.dx, H.dy, H.dz, H.nx, H.ny, H.nz, H.n_cells); + + #ifdef MPI_CHOLLA + // Now that we have the local maximum let's get the global maximum + H.max_magnetic_divergence = ReduceRealMax(H.max_magnetic_divergence); + #endif //MPI_CHOLLA + + // If the magnetic divergence is greater than the limit then raise a warning and exit + if (H.max_magnetic_divergence > H.magnetic_divergence_limit) + { + // Report the error and exit + chprintf("The magnetic divergence has exceeded the maximum allowed value. Divergence = %7.4e, the maximum allowed divergence = %7.4e\n", + H.max_magnetic_divergence, H.magnetic_divergence_limit); + chexit(-1); + } + else if (H.max_magnetic_divergence < 0.0) + { + // Report the error and exit + chprintf("The magnetic divergence is negative. 
Divergence = %7.4e\n", + H.max_magnetic_divergence); + chexit(-1); + } + else // The magnetic divergence is within acceptable bounds + { + chprintf("Global maximum magnetic divergence = %7.4e\n", H.max_magnetic_divergence); + } + } +#endif //MHD + /*! \fn void Reset(void) * \brief Reset the Grid3D class. */ void Grid3D::Reset(void) @@ -623,11 +662,6 @@ void Grid3D::FreeMemory(void) // free the conserved variable arrays CudaSafeCall( cudaFreeHost(C.host) ); - // free the timestep arrays - CudaSafeCall( cudaFreeHost(host_dti_array) ); - cudaFree(dev_dti_array); - cudaFree(dev_dti); - #ifdef GRAVITY CudaSafeCall( cudaFreeHost(C.Grav_potential) ); CudaSafeCall( cudaFree(C.d_Grav_potential) ); diff --git a/src/grid/grid3D.h b/src/grid/grid3D.h index f121bd423..c98971189 100644 --- a/src/grid/grid3D.h +++ b/src/grid/grid3D.h @@ -245,6 +245,11 @@ struct Header Real sphere_center_y; Real sphere_center_z; + #ifdef MHD + Real max_magnetic_divergence; + Real const magnetic_divergence_limit = 1.0E-14; + #endif //MHD + #ifdef GRAVITY /*! \var n_ghost_potential_offset @@ -450,26 +455,6 @@ class Grid3D void set_dt_Gravity(); #endif - /*! \fn Real calc_dti_CPU_1D() - * \brief Calculate the maximum inverse timestep on 1D, according to the CFL condition (Toro 6.17). */ - Real calc_dti_CPU_1D(); - - /*! \fn Real calc_dti_CPU_2D() - * \brief Calculate the maximum inverse timestep on 2D, according to the CFL condition (Toro 6.17). */ - Real calc_dti_CPU_2D(); - - /*! \fn Real calc_dti_CPU_3D_function() - * \brief Calculate the maximum inverse timestep on 3D using openMP, according to the CFL condition (Toro 6.17). */ - Real calc_dti_CPU_3D_function( int g_start, int g_end ); - - /*! \fn Real calc_dti_CPU_3D() - * \brief Calculate the maximum inverse timestep on 3D, according to the CFL condition (Toro 6.17). */ - Real calc_dti_CPU_3D(); - - /*! \fn Real calc_dti_CPU() - * \brief Calculate the maximum inverse timestep, according to the CFL condition (Toro 6.17). 
*/ - Real calc_dti_CPU(); - /*! \fn void Update_Grid(void) * \brief Update the conserved quantities in each cell. */ Real Update_Grid(void); @@ -480,6 +465,10 @@ class Grid3D void Update_Time(); + #ifdef MHD + void checkMagneticDivergence(Grid3D &G, struct parameters P, int nfile); + #endif //MHD + /*! \fn void Write_Header_Text(FILE *fp) * \brief Write the relevant header info to a text output file. */ void Write_Header_Text(FILE *fp); @@ -553,6 +542,41 @@ class Grid3D * \brief Sine wave perturbation. */ void Sound_Wave(Real rho, Real vx, Real vy, Real vz, Real P, Real A); + /*! + * \brief Initialize the grid with a simple linear wave. + * + * \param[in] rho The background density + * \param[in] vx The background velocity in the X-direction + * \param[in] vy The background velocity in the Y-direction + * \param[in] vz The background velocity in the Z-direction + * \param[in] P The background pressure + * \param[in] A The amplitude of the wave + * \param[in] Bx The background magnetic field in the X-direction + * \param[in] By The background magnetic field in the Y-direction + * \param[in] Bz The background magnetic field in the Z-direction + * \param[in] rEigenVec_rho The right eigenvector component for the density + * \param[in] rEigenVec_MomentumX The right eigenvector component for the velocity + * in the X-direction + * \param[in] rEigenVec_MomentumY The right eigenvector component for the velocity + * in the Y-direction + * \param[in] rEigenVec_MomentumZ The right eigenvector component for the velocity + * in the Z-direction + * \param[in] rEigenVec_E The right eigenvector component for the energy + * \param[in] rEigenVec_Bx The right eigenvector component for the magnetic + * field in the X-direction + * \param[in] rEigenVec_By The right eigenvector component for the magnetic + * field in the Y-direction + * \param[in] rEigenVec_Bz The right eigenvector component for the magnetic + * field in the Z-direction + * \param[in] pitch The pitch angle of the linear 
wave + * \param[in] yaw The yaw angle of the linear wave + */ + void Linear_Wave(Real rho, Real vx, Real vy, Real vz, Real P, Real A, + Real Bx, Real By, Real Bz, Real rEigenVec_rho, + Real rEigenVec_MomentumX, Real rEigenVec_MomentumY, Real rEigenVec_MomentumZ, + Real rEigenVec_E, Real rEigenVec_Bx, Real rEigenVec_By, + Real rEigenVec_Bz, Real pitch, Real yaw); + /*! \fn void Square_Wave(Real rho, Real vx, Real vy, Real vz, Real P, Real A) * \brief Square wave density perturbation with amplitude A*rho in pressure equilibrium. */ void Square_Wave(Real rho, Real vx, Real vy, Real vz, Real P, Real A); diff --git a/src/grid/initial_conditions.cpp b/src/grid/initial_conditions.cpp index 4786fb446..5d98d8367 100644 --- a/src/grid/initial_conditions.cpp +++ b/src/grid/initial_conditions.cpp @@ -13,10 +13,13 @@ #include "../mpi/mpi_routines.h" #include "../io/io.h" #include "../utils/error_handling.h" +#include "../utils/mhd_utilities.h" +#include "../utils/math_utilities.h" #include #include #include #include +#include using namespace std; @@ -31,6 +34,10 @@ void Grid3D::Set_Initial_Conditions(parameters P) { Constant(P.rho, P.vx, P.vy, P.vz, P.P, P.Bx, P.By, P.Bz); } else if (strcmp(P.init, "Sound_Wave")==0) { Sound_Wave(P.rho, P.vx, P.vy, P.vz, P.P, P.A); + } else if (strcmp(P.init, "Linear_Wave")==0) { + Linear_Wave(P.rho, P.vx, P.vy, P.vz, P.P, P.A, P.Bx, P.By, P.Bz, + P.rEigenVec_rho, P.rEigenVec_MomentumX, P.rEigenVec_MomentumY, P.rEigenVec_MomentumZ, + P.rEigenVec_E, P.rEigenVec_Bx, P.rEigenVec_By, P.rEigenVec_Bz, P.pitch, P.yaw); } else if (strcmp(P.init, "Square_Wave")==0) { Square_Wave(P.rho, P.vx, P.vy, P.vz, P.P, P.A); } else if (strcmp(P.init, "Riemann")==0) { @@ -62,9 +69,9 @@ void Grid3D::Set_Initial_Conditions(parameters P) { } else if (strcmp(P.init, "Spherical_Overpressure_3D")==0) { Spherical_Overpressure_3D(); } else if (strcmp(P.init, "Spherical_Overdensity_3D")==0) { - Spherical_Overdensity_3D(); + Spherical_Overdensity_3D(); } else if 
(strcmp(P.init, "Clouds")==0) { - Clouds(); + Clouds(); } else if (strcmp(P.init, "Read_Grid")==0) { #ifndef ONLY_PARTICLES Read_Grid(P); @@ -116,8 +123,8 @@ void Grid3D::Set_Domain_Properties(struct parameters P) H.zblocal = H.zbound; H.xblocal_max = H.xblocal + P.xlen; - H.yblocal_max = H.yblocal + P.ylen; - H.zblocal_max = H.zblocal + P.zlen; + H.yblocal_max = H.yblocal + P.ylen; + H.zblocal_max = H.zblocal + P.zlen; #else Real nx_param = (Real) nx_global; @@ -237,7 +244,6 @@ void Grid3D::Constant(Real rho, Real vx, Real vy, Real vz, Real P, Real Bx, Real } - /*! \fn void Sound_Wave(Real rho, Real vx, Real vy, Real vz, Real P, Real A) * \brief Sine wave perturbation. */ void Grid3D::Sound_Wave(Real rho, Real vx, Real vy, Real vz, Real P, Real A) @@ -291,6 +297,61 @@ void Grid3D::Sound_Wave(Real rho, Real vx, Real vy, Real vz, Real P, Real A) #ifdef DE C.GasEnergy[id] = P/(gama-1.0); #endif //DE + #ifdef DE + C.GasEnergy[id] = P/(gama-1.0); + #endif //DE + } + } + } + +} + +/*! \fn void Linear_Wave(Real rho, Real vx, Real vy, Real vz, Real P, Real A) + * \brief Sine wave perturbation. */ +void Grid3D::Linear_Wave(Real rho, Real vx, Real vy, Real vz, Real P, Real A, + Real Bx, Real By, Real Bz, Real rEigenVec_rho, + Real rEigenVec_MomentumX, Real rEigenVec_MomentumY, Real rEigenVec_MomentumZ, + Real rEigenVec_E, Real rEigenVec_Bx, Real rEigenVec_By, + Real rEigenVec_Bz, Real pitch, Real yaw) +{ + auto [stagger, junk1, junk2] = math_utils::rotateCoords(H.dx/2, H.dy/2, H.dz/2, pitch, yaw); + + // set initial values of conserved variables + for(int k=H.n_ghost; k(i, j, k, pitch, yaw); + + //get cell index + int id = i + j*H.nx + k*H.nx*H.ny; + + // get cell-centered position + Real x_pos, y_pos, z_pos; + Get_Position(i_rot, j_rot, k_rot, &x_pos, &y_pos, &z_pos); + + // set constant initial states. 
Note that mhd::utils::computeEnergy + // computes the hydro energy if MHD is turned off + Real sine_wave = std::sin(2.0 * PI * x_pos); + + C.density[id] = rho; + C.momentum_x[id] = rho*vx; + C.momentum_y[id] = rho*vy; + C.momentum_z[id] = rho*vz; + C.Energy[id] = mhd::utils::computeEnergy(P, rho, vx, vy, vz, Bx, By, Bz, gama); + // add small-amplitude perturbations + C.density[id] += A * rEigenVec_rho * sine_wave; + C.momentum_x[id] += A * rEigenVec_MomentumX * sine_wave; + C.momentum_y[id] += A * rEigenVec_MomentumY * sine_wave; + C.momentum_z[id] += A * rEigenVec_MomentumZ * sine_wave; + C.Energy[id] += A * rEigenVec_E * sine_wave; + + #ifdef MHD + sine_wave = std::sin(2.0 * PI * (x_pos+stagger)); + C.magnetic_x[id] = Bx + A * rEigenVec_Bx * sine_wave; + C.magnetic_y[id] = By + A * rEigenVec_By * sine_wave; + C.magnetic_z[id] = Bz + A * rEigenVec_Bz * sine_wave; + #endif //MHD } } } @@ -405,26 +466,6 @@ void Grid3D::Riemann(Real rho_l, Real vx_l, Real vy_l, Real vz_l, Real P_l, Real kend = H.nz; } - #ifdef MHD - auto setMagnetFields = [&] () - { - Real x_pos_face = x_pos + 0.5 * H.dx; - - if (x_pos_face < diaph) - { - C.magnetic_x[id] = Bx_l; - C.magnetic_y[id] = By_l; - C.magnetic_z[id] = Bz_l; - } - else - { - C.magnetic_x[id] = Bx_r; - C.magnetic_y[id] = By_r; - C.magnetic_z[id] = Bz_r; - } - }; - #endif // MHD - // set initial values of conserved variables for(k=kstart-1; k #include #include +#include #include "../utils/gpu.hpp" #include "../global/global.h" @@ -14,6 +15,7 @@ #include "../utils/hydro_utilities.h" #include "../utils/cuda_utilities.h" #include "../utils/reduction_utilities.h" +#include "../utils/DeviceVector.h" __global__ void Update_Conserved_Variables_1D(Real *dev_conserved, Real *dev_F, int n_cells, int x_off, int n_ghost, Real dx, Real xbound, Real dt, Real gamma, int n_fields) @@ -425,8 +427,8 @@ __device__ __host__ Real mhdInverseCrossingTime(Real const &E, Real const &gamma) { // Compute the gas pressure and fast magnetosonic speed - 
Real gasP = mhdUtils::computeGasPressure(E, d, vx*d, vy*d, vz*d, avgBx, avgBy, avgBz, gamma); - Real cf = mhdUtils::fastMagnetosonicSpeed(d, gasP, avgBx, avgBy, avgBz, gamma); + Real gasP = mhd::utils::computeGasPressure(E, d, vx*d, vy*d, vz*d, avgBx, avgBy, avgBz, gamma); + Real cf = mhd::utils::fastMagnetosonicSpeed(d, gasP, avgBx, avgBy, avgBz, gamma); // Find maximum inverse crossing time in the cell (i.e. minimum crossing time) Real cellMaxInverseDt = fmax((fabs(vx)+cf)/dx, (fabs(vy)+cf)/dy); @@ -470,10 +472,8 @@ __global__ void Calc_dt_1D(Real *dev_conserved, Real *dev_dti, Real gamma, int n } } - // do the block wide reduction (find the max inverse timestep in the block) - // then write it to that block's location in the dev_dti array - max_dti = reduction_utilities::blockReduceMax(max_dti); - if (threadIdx.x == 0) dev_dti[blockIdx.x] = max_dti; + // do the grid wide reduction (find the max inverse timestep in the grid) + reduction_utilities::gridReduceMax(max_dti, dev_dti); } @@ -514,10 +514,8 @@ __global__ void Calc_dt_2D(Real *dev_conserved, Real *dev_dti, Real gamma, int n } } - // do the block wide reduction (find the max inverse timestep in the block) - // then write it to that block's location in the dev_dti array - max_dti = reduction_utilities::blockReduceMax(max_dti); - if (threadIdx.x == 0) dev_dti[blockIdx.x] = max_dti; + // do the grid wide reduction (find the max inverse timestep in the grid) + reduction_utilities::gridReduceMax(max_dti, dev_dti); } @@ -556,7 +554,7 @@ __global__ void Calc_dt_3D(Real *dev_conserved, Real *dev_dti, Real gamma, int n #ifdef MHD // Compute the cell centered magnetic field using a straight average of // the faces - mhdUtils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny, avgBx, avgBy, avgBz); + mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny, avgBx, avgBy, avgBz); #endif //MHD // Compute the maximum inverse crossing time in the cell @@ -569,62 
+567,44 @@ __global__ void Calc_dt_3D(Real *dev_conserved, Real *dev_dti, Real gamma, int n } } - // do the block wide reduction (find the max inverse timestep in the block) - // then write it to that block's location in the dev_dti array - max_dti = reduction_utilities::blockReduceMax(max_dti); - if (threadIdx.x == 0) dev_dti[blockIdx.x] = max_dti; + // do the grid wide reduction (find the max inverse timestep in the grid) + reduction_utilities::gridReduceMax(max_dti, dev_dti); } Real Calc_dt_GPU(Real *dev_conserved, int nx, int ny, int nz, int n_ghost, int n_fields, Real dx, Real dy, Real dz, Real gamma ) { - // set values for GPU kernels - uint threadsPerBlock, numBlocks; - int ngrid = (nx*ny*nz + TPB - 1 )/TPB; - // reduction_utilities::reductionLaunchParams(numBlocks, threadsPerBlock); // Uncomment this if we fix the AtomicDouble bug - Alwin - threadsPerBlock = TPB; - numBlocks = ngrid; - - Real* dev_dti = dev_dti_array; + // Allocate the device memory + cuda_utilities::DeviceVector static dev_dti(1); + // Set the device side inverse time step to the smallest possible double so + // that the reduction isn't using the maximum value of the previous iteration + dev_dti.assign(std::numeric_limits::lowest()); // compute dt and store in dev_dti if (nx > 1 && ny == 1 && nz == 1) //1D { - hipLaunchKernelGGL(Calc_dt_1D, numBlocks, threadsPerBlock, 0, 0, dev_conserved, dev_dti, gamma, n_ghost, nx, dx); + // set launch parameters for GPU kernels. + cuda_utilities::AutomaticLaunchParams static const launchParams(Calc_dt_1D); + hipLaunchKernelGGL(Calc_dt_1D, launchParams.numBlocks, launchParams.threadsPerBlock, 0, 0, + dev_conserved, dev_dti.data(), gamma, n_ghost, nx, dx); } else if (nx > 1 && ny > 1 && nz == 1) //2D { - hipLaunchKernelGGL(Calc_dt_2D, numBlocks, threadsPerBlock, 0, 0, dev_conserved, dev_dti, gamma, n_ghost, nx, ny, dx, dy); + // set launch parameters for GPU kernels. 
+ cuda_utilities::AutomaticLaunchParams static const launchParams(Calc_dt_2D); + hipLaunchKernelGGL(Calc_dt_2D, launchParams.numBlocks, launchParams.threadsPerBlock, 0, 0, + dev_conserved, dev_dti.data(), gamma, n_ghost, nx, ny, dx, dy); } else if (nx > 1 && ny > 1 && nz > 1) //3D { - hipLaunchKernelGGL(Calc_dt_3D, numBlocks, threadsPerBlock, 0, 0, dev_conserved, dev_dti, gamma, n_ghost, n_fields, nx, ny, nz, dx, dy, dz); + // set launch parameters for GPU kernels. + cuda_utilities::AutomaticLaunchParams static const launchParams(Calc_dt_3D); + hipLaunchKernelGGL(Calc_dt_3D, launchParams.numBlocks, launchParams.threadsPerBlock, 0, 0, + dev_conserved, dev_dti.data(), gamma, n_ghost, n_fields, nx, ny, nz, dx, dy, dz); } CudaCheckError(); - Real max_dti=0; - - /* Uncomment the below if we fix the AtomicDouble bug - Alwin - // copy device side max_dti to host side max_dti - - - CudaSafeCall( cudaMemcpy(&max_dti, dev_dti, sizeof(Real), cudaMemcpyDeviceToHost) ); - cudaDeviceSynchronize(); - - return max_dti; - */ - - int dev_dti_length = numBlocks; - CudaSafeCall(cudaMemcpy(host_dti_array,dev_dti, dev_dti_length*sizeof(Real), cudaMemcpyDeviceToHost)); - cudaDeviceSynchronize(); - - for (int i=0;i max_dti_slow){ speed = sqrt(vx*vx + vy*vy + vz*vz); temp = (gamma - 1)*(E - 0.5*(speed*speed)*d)*ENERGY_UNIT/(d*DENSITY_UNIT/0.6/MP)/KB; P = (E - 0.5*d*(vx*vx + vy*vy + vz*vz)) * (gamma - 1.0); cs = sqrt(d_inv * gamma * P)*VELOCITY_UNIT*1e-5; // Average this cell - printf(" Average Slow Cell [ %d %d %d ] -> dt_cell=%f dt_min=%f, n=%.3e, T=%.3e, v=%.3e (%.3e, %.3e, %.3e), cs=%.3e\n", xid, yid, zid, 1./max_dti, 1./max_dti_slow, + printf(" Average Slow Cell [ %d %d %d ] -> dt_cell=%f dt_min=%f, n=%.3e, T=%.3e, v=%.3e (%.3e, %.3e, %.3e), cs=%.3e\n", xid, yid, zid, 1./max_dti, 1./max_dti_slow, dev_conserved[id]*DENSITY_UNIT/0.6/MP, temp, speed*VELOCITY_UNIT*1e-5, vx*VELOCITY_UNIT*1e-5, vy*VELOCITY_UNIT*1e-5, vz*VELOCITY_UNIT*1e-5, cs); Average_Cell_All_Fields( xid, yid, zid, nx, ny, 
nz, n_cells, n_fields, dev_conserved ); } } } -#endif //AVERAGE_SLOW_CELLS +#endif //AVERAGE_SLOW_CELLS #ifdef DE @@ -829,7 +809,13 @@ __global__ void Partial_Update_Advected_Internal_Energy_3D( Real *dev_conserved, //PRESSURE_DE E = dev_conserved[4*n_cells + id]; GE = dev_conserved[(n_fields-1)*n_cells + id]; - E_kin = 0.5 * d * ( vx*vx + vy*vy + vz*vz ); + E_kin = hydro_utilities::Calc_Kinetic_Energy_From_Velocity(d, vx, vy, vz); + #ifdef MHD + // Add the magnetic energy + Real centeredBx, centeredBy, centeredBz; + mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny, centeredBx, centeredBy, centeredBz); + E_kin += mhd::utils::computeMagneticEnergy(centeredBx, centeredBy, centeredBz); + #endif //MHD P = hydro_utilities::Get_Pressure_From_DE( E, E - E_kin, GE, gamma ); P = fmax(P, (Real) TINY_NUMBER); diff --git a/src/hydro/hydro_cuda_tests.cu b/src/hydro/hydro_cuda_tests.cu index a6d00e96b..eb9c3f9ed 100644 --- a/src/hydro/hydro_cuda_tests.cu +++ b/src/hydro/hydro_cuda_tests.cu @@ -19,6 +19,7 @@ #include "../global/global_cuda.h" #include "../utils/gpu.hpp" #include "../utils/testing_utilities.h" +#include "../utils/DeviceVector.h" #include "../hydro/hydro_cuda.h" // Include code to test #if defined(CUDA) @@ -44,38 +45,31 @@ TEST(tHYDROCalcDt3D, CorrectInputExpectCorrectOutput) Real dx = 1.0; Real dy = 1.0; Real dz = 1.0; - Real *host_conserved; - Real *dev_conserved; - Real *dev_dti_array; + std::vector host_conserved(n_fields); + cuda_utilities::DeviceVector dev_conserved(n_fields); + cuda_utilities::DeviceVector dev_dti(1); Real gamma = 5.0/3.0; - // Allocate host and device arrays and copy data - cudaHostAlloc(&host_conserved, n_fields*sizeof(Real), cudaHostAllocDefault); - CudaSafeCall(cudaMalloc(&dev_conserved, n_fields*sizeof(Real))); - CudaSafeCall(cudaMalloc(&dev_dti_array, sizeof(Real))); - // Set values of conserved variables for input (host) - host_conserved[0] = 1.0; // density - host_conserved[1] = 0.0; // x momentum - 
host_conserved[2] = 0.0; // y momentum - host_conserved[3] = 0.0; // z momentum - host_conserved[4] = 1.0; // Energy + host_conserved.at(0) = 1.0; // density + host_conserved.at(1) = 0.0; // x momentum + host_conserved.at(2) = 0.0; // y momentum + host_conserved.at(3) = 0.0; // z momentum + host_conserved.at(4) = 1.0; // Energy // Copy host data to device arrray - CudaSafeCall(cudaMemcpy(dev_conserved, host_conserved, n_fields*sizeof(Real), cudaMemcpyHostToDevice)); - //__global__ void Calc_dt_3D(Real *dev_conserved, Real *dev_dti, Real gamma, int n_ghost, int n_fields, int nx, int ny, int nz, Real dx, Real dy, Real dz) + dev_conserved.cpyHostToDevice(host_conserved); // Run the kernel - hipLaunchKernelGGL(Calc_dt_3D, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, dev_dti_array, gamma, n_ghost, n_fields, nx, ny, nz, dx, dy, dz); + hipLaunchKernelGGL(Calc_dt_3D, dim1dGrid, dim1dBlock, 0, 0, + dev_conserved.data(), dev_dti.data(), gamma, n_ghost, + n_fields, nx, ny, nz, dx, dy, dz); CudaCheckError(); - // Copy the dt value back from the GPU - CudaSafeCall(cudaMemcpy(testDt, dev_dti_array, sizeof(Real), cudaMemcpyDeviceToHost)); - // Compare results // Check for equality and if not equal return difference - double fiducialDt = 1.0540925533894598; - double testData = testDt[0]; + double const fiducialDt = 1.0540925533894598; + double const testData = dev_dti.at(0); double absoluteDiff; int64_t ulpsDiff; bool areEqual; diff --git a/src/integrators/VL_3D_cuda.cu b/src/integrators/VL_3D_cuda.cu index 097708ede..2d23cc636 100644 --- a/src/integrators/VL_3D_cuda.cu +++ b/src/integrators/VL_3D_cuda.cu @@ -1,8 +1,7 @@ /*! \file VL_3D_cuda.cu - * \brief Definitions of the cuda 3D VL algorithm functions. */ + * \brief Definitions of the cuda 3D VL algorithm functions. 
*/ -#ifdef CUDA -#ifdef VL +#if defined(CUDA) && defined(VL) #include #include @@ -21,8 +20,11 @@ #include "../riemann_solvers/exact_cuda.h" #include "../riemann_solvers/roe_cuda.h" #include "../riemann_solvers/hllc_cuda.h" -#include "../io/io.h" #include "../riemann_solvers/hll_cuda.h" +#include "../riemann_solvers/hlld_cuda.h" +#include "../mhd/ct_electric_fields.h" +#include "../mhd/magnetic_update.h" +#include "../io/io.h" __global__ void Update_Conserved_Variables_3D_half(Real *dev_conserved, Real *dev_conserved_half, Real *dev_F_x, Real *dev_F_y, Real *dev_F_z, int nx, int ny, int nz, int n_ghost, Real dx, Real dy, Real dz, Real dt, Real gamma, int n_fields, Real density_floor); @@ -33,7 +35,6 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real *d_grav_potential, int nx, int Real ybound, Real zbound, Real dt, int n_fields, Real density_floor, Real U_floor, Real *host_grav_potential ) { - //Here, *dev_conserved contains the entire //set of conserved variables on the grid //concatenated into a 1-d array @@ -53,42 +54,87 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real *d_grav_potential, int nx, int if ( !memory_allocated ){ // allocate memory on the GPU - //CudaSafeCall( cudaMalloc((void**)&dev_conserved, n_fields*n_cells*sizeof(Real)) ); dev_conserved = d_conserved; + + // Set the size of the interface and flux arrays + #ifdef MHD + // In MHD/Constrained Transport the interface arrays have one fewer fields + // since the magnetic field that is stored on the face does not require + // reconstructions. Similarly the fluxes have one fewer fields since the + // magnetic field on that face doesn't have an associated flux. Each + // interface array store the magnetic fields on that interface that are + // not perpendicular to the interface and arranged cyclically. I.e. 
the + // `Q_Lx` interface stores the reconstructed Y and Z magnetic fields in + // that order, the `Q_Ly` interface stores the Z and X magnetic fields in + // that order, and the `Q_Lz` interface stores the X and Y magnetic fields + // in that order. These fields start at the (5+NSCALARS)*n_cells and + // (6+NSCALARS)*n_cells locations respectively. The interface state arrays + // store in the interface on the "right" side of the cell, so the flux + // arrays store the fluxes through the right interface + // + // According to the source code of Athena, the following equations relate + // the magnetic flux to the face centered electric fields/EMF. + // -cross(V,B)x is the negative of the x-component of V cross B. Note that + // "X" is the direction the solver is running in this case, not + // necessarily the true "X". + // F_x[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Z + // F_x[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Y + // F_y[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_X + // F_y[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Z + // F_z[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Y + // F_z[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_X + size_t const arraySize = (n_fields-1) * n_cells * sizeof(Real); + size_t const ctArraySize = 3 * n_cells * sizeof(Real); + #else // not MHD + size_t const arraySize = n_fields*n_cells*sizeof(Real); + #endif //MHD CudaSafeCall( cudaMalloc((void**)&dev_conserved_half, n_fields*n_cells*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&Q_Lx, n_fields*n_cells*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&Q_Rx, n_fields*n_cells*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&Q_Ly, n_fields*n_cells*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&Q_Ry, n_fields*n_cells*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&Q_Lz, n_fields*n_cells*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&Q_Rz, 
n_fields*n_cells*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&F_x, n_fields*n_cells*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&F_y, n_fields*n_cells*sizeof(Real)) ); - CudaSafeCall( cudaMalloc((void**)&F_z, n_fields*n_cells*sizeof(Real)) ); + CudaSafeCall( cudaMalloc((void**)&Q_Lx, arraySize) ); + CudaSafeCall( cudaMalloc((void**)&Q_Rx, arraySize) ); + CudaSafeCall( cudaMalloc((void**)&Q_Ly, arraySize) ); + CudaSafeCall( cudaMalloc((void**)&Q_Ry, arraySize) ); + CudaSafeCall( cudaMalloc((void**)&Q_Lz, arraySize) ); + CudaSafeCall( cudaMalloc((void**)&Q_Rz, arraySize) ); + CudaSafeCall( cudaMalloc((void**)&F_x, arraySize) ); + CudaSafeCall( cudaMalloc((void**)&F_y, arraySize) ); + CudaSafeCall( cudaMalloc((void**)&F_z, arraySize) ); + + cuda_utilities::initGpuMemory(dev_conserved_half, n_fields*n_cells*sizeof(Real)); + cuda_utilities::initGpuMemory(Q_Lx, arraySize); + cuda_utilities::initGpuMemory(Q_Rx, arraySize); + cuda_utilities::initGpuMemory(Q_Ly, arraySize); + cuda_utilities::initGpuMemory(Q_Ry, arraySize); + cuda_utilities::initGpuMemory(Q_Lz, arraySize); + cuda_utilities::initGpuMemory(Q_Rz, arraySize); + cuda_utilities::initGpuMemory(F_x, arraySize); + cuda_utilities::initGpuMemory(F_y, arraySize); + cuda_utilities::initGpuMemory(F_z, arraySize); + + #ifdef MHD + CudaSafeCall( cudaMalloc((void**)&ctElectricFields, ctArraySize) ); + cuda_utilities::initGpuMemory(ctElectricFields, ctArraySize); + #endif //MHD #if defined( GRAVITY ) - // CudaSafeCall( cudaMalloc((void**)&dev_grav_potential, n_cells*sizeof(Real)) ); dev_grav_potential = d_grav_potential; - #else + #else // not GRAVITY dev_grav_potential = NULL; - #endif + #endif //GRAVITY // If memory is single allocated: memory_allocated becomes true and successive timesteps won't allocate memory. // If the memory is not single allocated: memory_allocated remains Null and memory is allocated every timestep. 
memory_allocated = true; - } #if defined( GRAVITY ) && !defined( GRAVITY_GPU ) CudaSafeCall( cudaMemcpy(dev_grav_potential, temp_potential, n_cells*sizeof(Real), cudaMemcpyHostToDevice) ); - #endif + #endif //GRAVITY and GRAVITY_GPU // Step 1: Use PCM reconstruction to put primitive variables into interface arrays hipLaunchKernelGGL(PCM_Reconstruction_3D, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, Q_Lx, Q_Rx, Q_Ly, Q_Ry, Q_Lz, Q_Rz, nx, ny, nz, n_ghost, gama, n_fields); CudaCheckError(); - // Step 2: Calculate first-order upwind fluxes #ifdef EXACT hipLaunchKernelGGL(Calculate_Exact_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lx, Q_Rx, F_x, nx, ny, nz, n_ghost, gama, 0, n_fields); @@ -110,18 +156,32 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real *d_grav_potential, int nx, int hipLaunchKernelGGL(Calculate_HLL_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Ly, Q_Ry, F_y, nx, ny, nz, n_ghost, gama, 1, n_fields); hipLaunchKernelGGL(Calculate_HLL_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); #endif //HLL + #ifdef HLLD + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lx, Q_Rx, &(dev_conserved[(5 + NSCALARS) * n_cells]), F_x, nx, ny, nz, n_ghost, gama, 0, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Ly, Q_Ry, &(dev_conserved[(6 + NSCALARS) * n_cells]), F_y, nx, ny, nz, n_ghost, gama, 1, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, &(dev_conserved[(7 + NSCALARS) * n_cells]), F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); + #endif //HLLD CudaCheckError(); + #ifdef MHD + // Step 2.5: Compute the Constrained transport electric fields + hipLaunchKernelGGL(mhd::Calculate_CT_Electric_Fields, dim1dGrid, dim1dBlock, 0, 0, F_x, F_y, F_z, dev_conserved, ctElectricFields, nx, ny, nz, n_cells); + CudaCheckError(); + #endif //MHD // Step 3: Update the conserved variables half a 
timestep hipLaunchKernelGGL(Update_Conserved_Variables_3D_half, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, dev_conserved_half, F_x, F_y, F_z, nx, ny, nz, n_ghost, dx, dy, dz, 0.5*dt, gama, n_fields, density_floor ); CudaCheckError(); - + #ifdef MHD + // Update the magnetic fields + hipLaunchKernelGGL(mhd::Update_Magnetic_Field_3D, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, dev_conserved_half, ctElectricFields, nx, ny, nz, n_cells, 0.5*dt, dx, dy, dz); + CudaCheckError(); + #endif //MHD // Step 4: Construct left and right interface values using updated conserved variables #ifdef PCM hipLaunchKernelGGL(PCM_Reconstruction_3D, dim1dGrid, dim1dBlock, 0, 0, dev_conserved_half, Q_Lx, Q_Rx, Q_Ly, Q_Ry, Q_Lz, Q_Rz, nx, ny, nz, n_ghost, gama, n_fields); - #endif + #endif //PCM #ifdef PLMP hipLaunchKernelGGL(PLMP_cuda, dim1dGrid, dim1dBlock, 0, 0, dev_conserved_half, Q_Lx, Q_Rx, nx, ny, nz, n_ghost, dx, dt, gama, 0, n_fields); hipLaunchKernelGGL(PLMP_cuda, dim1dGrid, dim1dBlock, 0, 0, dev_conserved_half, Q_Ly, Q_Ry, nx, ny, nz, n_ghost, dy, dt, gama, 1, n_fields); @@ -131,7 +191,7 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real *d_grav_potential, int nx, int hipLaunchKernelGGL(PLMC_cuda, dim1dGrid, dim1dBlock, 0, 0, dev_conserved_half, Q_Lx, Q_Rx, nx, ny, nz, n_ghost, dx, dt, gama, 0, n_fields); hipLaunchKernelGGL(PLMC_cuda, dim1dGrid, dim1dBlock, 0, 0, dev_conserved_half, Q_Ly, Q_Ry, nx, ny, nz, n_ghost, dy, dt, gama, 1, n_fields); hipLaunchKernelGGL(PLMC_cuda, dim1dGrid, dim1dBlock, 0, 0, dev_conserved_half, Q_Lz, Q_Rz, nx, ny, nz, n_ghost, dz, dt, gama, 2, n_fields); - #endif + #endif //PLMC #ifdef PPMP hipLaunchKernelGGL(PPMP_cuda, dim1dGrid, dim1dBlock, 0, 0, dev_conserved_half, Q_Lx, Q_Rx, nx, ny, nz, n_ghost, dx, dt, gama, 0, n_fields); hipLaunchKernelGGL(PPMP_cuda, dim1dGrid, dim1dBlock, 0, 0, dev_conserved_half, Q_Ly, Q_Ry, nx, ny, nz, n_ghost, dy, dt, gama, 1, n_fields); @@ -166,29 +226,46 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real 
*d_grav_potential, int nx, int hipLaunchKernelGGL(Calculate_HLL_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Ly, Q_Ry, F_y, nx, ny, nz, n_ghost, gama, 1, n_fields); hipLaunchKernelGGL(Calculate_HLL_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); #endif //HLLC + #ifdef HLLD + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lx, Q_Rx, &(dev_conserved_half[(5 + NSCALARS) * n_cells]), F_x, nx, ny, nz, n_ghost, gama, 0, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Ly, Q_Ry, &(dev_conserved_half[(6 + NSCALARS) * n_cells]), F_y, nx, ny, nz, n_ghost, gama, 1, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, &(dev_conserved_half[(7 + NSCALARS) * n_cells]), F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); + #endif //HLLD CudaCheckError(); #ifdef DE // Compute the divergence of Vel before updating the conserved array, this solves synchronization issues when adding this term on Update_Conserved_Variables_3D hipLaunchKernelGGL(Partial_Update_Advected_Internal_Energy_3D, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, Q_Lx, Q_Rx, Q_Ly, Q_Ry, Q_Lz, Q_Rz, nx, ny, nz, n_ghost, dx, dy, dz, dt, gama, n_fields ); CudaCheckError(); - #endif + #endif //DE + #ifdef MHD + // Step 5.5: Compute the Constrained transport electric fields + hipLaunchKernelGGL(mhd::Calculate_CT_Electric_Fields, dim1dGrid, dim1dBlock, 0, 0, F_x, F_y, F_z, dev_conserved_half, ctElectricFields, nx, ny, nz, n_cells); + CudaCheckError(); + #endif //MHD // Step 6: Update the conserved variable array hipLaunchKernelGGL(Update_Conserved_Variables_3D, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, Q_Lx, Q_Rx, Q_Ly, Q_Ry, Q_Lz, Q_Rz, F_x, F_y, F_z, nx, ny, nz, x_off, y_off, z_off, n_ghost, dx, dy, dz, xbound, ybound, zbound, dt, gama, n_fields, density_floor, dev_grav_potential); CudaCheckError(); + #ifdef MHD + // Update the magnetic fields 
+ hipLaunchKernelGGL(mhd::Update_Magnetic_Field_3D, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, dev_conserved, ctElectricFields, nx, ny, nz, n_cells, dt, dx, dy, dz); + CudaCheckError(); + #endif //MHD + + #ifdef DE hipLaunchKernelGGL(Select_Internal_Energy_3D, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, nx, ny, nz, n_ghost, n_fields); hipLaunchKernelGGL(Sync_Energies_3D, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, nx, ny, nz, n_ghost, gama, n_fields); CudaCheckError(); - #endif + #endif //DE #ifdef TEMPERATURE_FLOOR hipLaunchKernelGGL(Apply_Temperature_Floor, dim1dGrid, dim1dBlock, 0, 0, dev_conserved, nx, ny, nz, n_ghost, n_fields, U_floor ); CudaCheckError(); #endif //TEMPERATURE_FLOOR + return; } @@ -208,6 +285,7 @@ void Free_Memory_VL_3D(){ cudaFree(F_x); cudaFree(F_y); cudaFree(F_z); + cudaFree(ctElectricFields); } @@ -233,11 +311,11 @@ __global__ void Update_Conserved_Variables_3D_half(Real *dev_conserved, Real *de Real d, d_inv, vx, vy, vz; Real vx_imo, vx_ipo, vy_jmo, vy_jpo, vz_kmo, vz_kpo, P, E, E_kin, GE; int ipo, jpo, kpo; - #endif + #endif //DE #ifdef DENSITY_FLOOR Real dens_0; - #endif + #endif //DENSITY_FLOOR // threads corresponding to all cells except outer ring of ghost cells do the calculation if (xid > 0 && xid < nx-1 && yid > 0 && yid < ny-1 && zid > 0 && zid < nz-1) @@ -251,7 +329,13 @@ __global__ void Update_Conserved_Variables_3D_half(Real *dev_conserved, Real *de //PRESSURE_DE E = dev_conserved[4*n_cells + id]; GE = dev_conserved[(n_fields-1)*n_cells + id]; - E_kin = 0.5 * d * ( vx*vx + vy*vy + vz*vz ); + E_kin = hydro_utilities::Calc_Kinetic_Energy_From_Velocity(d, vx, vy, vz); + #ifdef MHD + // Add the magnetic energy + Real centeredBx, centeredBy, centeredBz; + mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny, centeredBx, centeredBy, centeredBz); + E_kin += mhd::utils::computeMagneticEnergy(centeredBx, centeredBy, centeredBz); + #endif //MHD P = hydro_utilities::Get_Pressure_From_DE( E, E - E_kin, 
GE, gamma ); P = fmax(P, (Real) TINY_NUMBER); // P = (dev_conserved[4*n_cells + id] - 0.5*d*(vx*vx + vy*vy + vz*vz)) * (gamma - 1.0); @@ -266,7 +350,7 @@ __global__ void Update_Conserved_Variables_3D_half(Real *dev_conserved, Real *de vy_jpo = dev_conserved[2*n_cells + jpo] / dev_conserved[jpo]; vz_kmo = dev_conserved[3*n_cells + kmo] / dev_conserved[kmo]; vz_kpo = dev_conserved[3*n_cells + kpo] / dev_conserved[kpo]; - #endif + #endif //DE // update the conserved variable array dev_conserved_half[ id] = dev_conserved[ id] @@ -296,14 +380,14 @@ __global__ void Update_Conserved_Variables_3D_half(Real *dev_conserved, Real *de + dtody * (dev_F_y[(5+i)*n_cells + jmo] - dev_F_y[(5+i)*n_cells + id]) + dtodz * (dev_F_z[(5+i)*n_cells + kmo] - dev_F_z[(5+i)*n_cells + id]); } - #endif + #endif //SCALAR #ifdef DE dev_conserved_half[(n_fields-1)*n_cells + id] = dev_conserved[(n_fields-1)*n_cells + id] + dtodx * (dev_F_x[(n_fields-1)*n_cells + imo] - dev_F_x[(n_fields-1)*n_cells + id]) + dtody * (dev_F_y[(n_fields-1)*n_cells + jmo] - dev_F_y[(n_fields-1)*n_cells + id]) + dtodz * (dev_F_z[(n_fields-1)*n_cells + kmo] - dev_F_z[(n_fields-1)*n_cells + id]) + 0.5*P*(dtodx*(vx_imo-vx_ipo) + dtody*(vy_jmo-vy_jpo) + dtodz*(vz_kmo-vz_kpo)); - #endif + #endif //DE #ifdef DENSITY_FLOOR if ( dev_conserved_half[ id] < density_floor ){ @@ -317,19 +401,11 @@ __global__ void Update_Conserved_Variables_3D_half(Real *dev_conserved, Real *de dev_conserved_half[4*n_cells + id] *= (density_floor / dens_0); #ifdef DE dev_conserved_half[(n_fields-1)*n_cells + id] *= (density_floor / dens_0); - #endif + #endif //DE } - #endif - //if (dev_conserved_half[id] < 0.0 || dev_conserved_half[id] != dev_conserved_half[id] || dev_conserved_half[4*n_cells+id] < 0.0 || dev_conserved_half[4*n_cells+id] != dev_conserved_half[4*n_cells+id]) { - //printf("%3d %3d %3d Thread crashed in half step update. 
d: %e E: %e\n", xid, yid, zid, dev_conserved_half[id], dev_conserved_half[4*n_cells+id]); //} - + #endif //DENSITY_FLOOR } } - - - -#endif //VL -#endif //CUDA +#endif //CUDA and VL diff --git a/src/io/io.h b/src/io/io.h index f7dfe6eb7..08489f7da 100644 --- a/src/io/io.h +++ b/src/io/io.h @@ -3,6 +3,8 @@ #include "../global/global.h" #include "../grid/grid3D.h" #include +#include +#include /* Write the data */ @@ -26,6 +28,23 @@ void OutputSlices(Grid3D &G, struct parameters P, int nfile); /* MPI-safe printf routine */ int chprintf(const char * __restrict sdata, ...); +/*! + * \brief Convert a floating point number to a string such that it can be + * exactly deserialized back from a string to the same floating point number. + * + * \tparam T Any floating point type + * \param[in] input The floating point number to convert + * \return std::string The string representation of the input floating point + */ +template <typename T> +std::string to_string_exact(T const &input) +{ + std::stringstream output; + output << std::setprecision(std::numeric_limits<T>::max_digits10); + output << input; + return output.str(); +} + void Create_Log_File( struct parameters P ); void Write_Message_To_Log_File( const char* message ); diff --git a/src/main.cpp b/src/main.cpp index da2348858..5ee396965 100644 --- a/src/main.cpp +++ b/src/main.cpp @@ -17,7 +17,7 @@ #include "particles/supernova.h" #ifdef ANALYSIS #include "analysis/feedback_analysis.h" -#endif +#endif #endif //SUPERNOVA #ifdef STAR_FORMATION #include "particles/star_formation.h" @@ -53,7 +53,6 @@ int main(int argc, char *argv[]) int nfile = 0; // number of output files Real outtime = 0; // current output time - // read in command line arguments if (argc < 2) { @@ -191,6 +190,12 @@ int main(int argc, char *argv[]) // add one to the output file count nfile++; #endif //OUTPUT + + #ifdef MHD + // Check that the initial magnetic field has zero divergence + G.checkMagneticDivergence(G, P, nfile); + #endif //MHD + // increment the next output 
time outtime += P.outstep; @@ -254,7 +259,7 @@ int main(int argc, char *argv[]) //Set the Grid boundary conditions for next time step G.Set_Boundary_Conditions_Grid(P); - + #ifdef GRAVITY_ANALYTIC_COMP G.Add_Analytic_Potential(); #endif @@ -266,7 +271,7 @@ int main(int argc, char *argv[]) #ifdef STAR_FORMATION star_formation::Star_Formation(G); - #endif + #endif #ifdef CPU_TIME G.Timer.Total.End(); @@ -332,6 +337,10 @@ int main(int argc, char *argv[]) } #endif + #ifdef MHD + // Check that the magnetic field has zero divergence + G.checkMagneticDivergence(G, P, nfile); + #endif //MHD } /*end loop over timesteps*/ diff --git a/src/mhd/ct_electric_fields.cu b/src/mhd/ct_electric_fields.cu new file mode 100644 index 000000000..64a17bf52 --- /dev/null +++ b/src/mhd/ct_electric_fields.cu @@ -0,0 +1,340 @@ +/*! + * \file ct_electric_fields.cu + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Contains implementation for the CT electric fields code + * + */ + +// STL Includes + +// External Includes + +// Local Includes +#include "../mhd/ct_electric_fields.h" + +namespace mhd +{ + // ========================================================================= + __global__ void Calculate_CT_Electric_Fields(Real const *fluxX, + Real const *fluxY, + Real const *fluxZ, + Real const *dev_conserved, + Real *ctElectricFields, + int const nx, + int const ny, + int const nz, + int const n_cells) + { + // get a thread index + int const threadId = threadIdx.x + blockIdx.x * blockDim.x; + int xid, yid, zid; + cuda_utilities::compute3DIndices(threadId, nx, ny, xid, yid, zid); + + // Thread guard to avoid overrun and to skip the first two cells since + // those ghost cells can't be reconstructed + if ( xid > 1 + and yid > 1 + and zid > 1 + and xid < nx + and yid < ny + and zid < nz) + { + // According to the source code of Athena, the following equation + // relate the magnetic flux to the face centered electric + // fields/EMF. 
-cross(V,B)x is the negative of the x-component of V + // cross B. Note that "X" is the direction the solver is running in + // this case, not necessarily the true "X". + // F_x[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Z + // F_x[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Y + // F_y[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_X + // F_y[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Z + // F_z[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Y + // F_z[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_X + + // Notes on Implementation Details + // - The density flux has the same sign as the velocity on the face + // and we only care about the sign so we're using the density flux + // to perform upwinding checks + // - All slopes are computed without the factor of two shown in + // Stone & Gardiner 2008 eqn. 24. That factor of two is taken care + // of in the final assembly of the electric field + + // Variable to get the sign of the velocity at the interface. + Real signUpwind; + + // Slope and face variables. Format is + // "__". Slope/Face indicates if the + // value is a slope or a face centered EMF, direction indicates the + // direction of the derivative/face and pos/neg indicates if it's + // the slope on the positive or negative side of the edge field + // being computed. 
Note that the direction for the face is parallel + // to the face and the other direction that is parallel to that face + // is the direction of the electric field being calculated + Real slope_x_pos, slope_x_neg, + slope_y_pos, slope_y_neg, + slope_z_pos, slope_z_neg, + face_x_pos, face_x_neg, + face_y_pos, face_y_neg, + face_z_pos, face_z_neg; + // ================ + // X electric field + // ================ + + // Y-direction slope on the positive Y side + signUpwind = fluxZ[cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny)]; + if (signUpwind > 0.0) + { + slope_y_pos = mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, 2, -1, 1, 2, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_y_pos = mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, -1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_y_pos = 0.5 * (mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, 2, -1, 1, 2, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, -1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // Y-direction slope on the negative Y side + signUpwind = fluxZ[cuda_utilities::compute1DIndex(xid, yid-1, zid-1, nx, ny)]; + if (signUpwind > 0.0) + { + slope_y_neg = mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, 1, 2, 1, 2, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_y_neg = mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, 1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_y_neg = 0.5 * (mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, 1, 2, 1, 2, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, 1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // Z-direction slope on the positive Z side + signUpwind = fluxY[cuda_utilities::compute1DIndex(xid, yid-1, zid, nx, ny)]; + if (signUpwind > 0.0) + { + slope_z_pos = mhd::_internal::_ctSlope(fluxZ, dev_conserved, 1, 0, 1, -1, 1, 2, 
xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_z_pos = mhd::_internal::_ctSlope(fluxZ, dev_conserved, 1, 0, -1, -1, 2, -1, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_z_pos = 0.5 * (mhd::_internal::_ctSlope(fluxZ, dev_conserved, 1, 0, 1, -1, 1, 2, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxZ, dev_conserved, 1, 0, -1, -1, 2, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // Z-direction slope on the negative Z side + signUpwind = fluxY[cuda_utilities::compute1DIndex(xid, yid-1, zid-1, nx, ny)]; + if (signUpwind > 0.0) + { + slope_z_neg = mhd::_internal::_ctSlope(fluxZ, dev_conserved, 1, 0, 1, 2, 1, 2, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_z_neg = mhd::_internal::_ctSlope(fluxZ, dev_conserved, 1, 0, 2, -1, -1, 2, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_z_neg = 0.5 * (mhd::_internal::_ctSlope(fluxZ, dev_conserved, 1, 0, 1, 2, 1, 2, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxZ, dev_conserved, 1, 0, 2, -1, -1, 2, xid, yid, zid, nx, ny, n_cells)); + } + + // Load the face centered electric fields Note the negative signs to + // convert from magnetic flux to electric field + + face_y_pos = + fluxZ[cuda_utilities::compute1DIndex(xid , yid , zid-1, nx, ny) + (6+NSCALARS)*n_cells]; + face_y_neg = + fluxZ[cuda_utilities::compute1DIndex(xid , yid-1, zid-1, nx, ny) + (6+NSCALARS)*n_cells]; + face_z_pos = - fluxY[cuda_utilities::compute1DIndex(xid , yid-1, zid , nx, ny) + (5+NSCALARS)*n_cells]; + face_z_neg = - fluxY[cuda_utilities::compute1DIndex(xid , yid-1, zid-1, nx, ny) + (5+NSCALARS)*n_cells]; + + // sum and average face centered electric fields and slopes to get the + // edge averaged electric field. 
+ ctElectricFields[threadId + 0*n_cells] = 0.25 * (+ face_y_pos + + face_y_neg + + face_z_pos + + face_z_neg + + slope_y_pos + + slope_y_neg + + slope_z_pos + + slope_z_neg); + + // ================ + // Y electric field + // ================ + + // X-direction slope on the positive X side + signUpwind = fluxZ[cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny)]; + if (signUpwind > 0.0) + { + slope_x_pos = mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, 2, -1, 0, 2, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_x_pos = mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, -1, -1, 0, -1, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_x_pos = 0.5 * (mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, 2, -1, 0, 2, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, -1, -1, 0, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // X-direction slope on the negative X side + signUpwind = fluxZ[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny)]; + if (signUpwind > 0.0) + { + slope_x_neg = mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, 0, 2, 0, 2, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_x_neg = mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, 0, -1, 0, -1, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_x_neg = 0.5 * (mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, 0, 2, 0, 2, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, 0, -1, 0, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // Z-direction slope on the positive Z side + signUpwind = fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid, nx, ny)]; + if (signUpwind > 0.0) + { + slope_z_pos = mhd::_internal::_ctSlope(fluxZ, dev_conserved, -1, 1, 0, -1, 0, 2, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_z_pos = mhd::_internal::_ctSlope(fluxZ, dev_conserved, -1, 1, -1, -1, 2, -1, xid, yid, zid, nx, ny, 
n_cells); + } + else + { + slope_z_pos = 0.5 * (mhd::_internal::_ctSlope(fluxZ, dev_conserved, -1, 1, 0, -1, 0, 2, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxZ, dev_conserved, -1, 1, -1, -1, 2, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // Z-direction slope on the negative Z side + signUpwind = fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny)]; + if (signUpwind > 0.0) + { + slope_z_neg = mhd::_internal::_ctSlope(fluxZ, dev_conserved, -1, 1, 0, 2, 0, 2, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_z_neg = mhd::_internal::_ctSlope(fluxZ, dev_conserved, -1, 1, 2, -1, 2, -1, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_z_neg = 0.5 * (mhd::_internal::_ctSlope(fluxZ, dev_conserved, -1, 1, 0, 2, 0, 2, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxZ, dev_conserved, -1, 1, 2, -1, 2, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // Load the face centered electric fields Note the negative signs to + // convert from magnetic flux to electric field + face_x_pos = - fluxZ[cuda_utilities::compute1DIndex(xid , yid, zid-1, nx, ny) + (5+NSCALARS)*n_cells]; + face_x_neg = - fluxZ[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny) + (5+NSCALARS)*n_cells]; + face_z_pos = + fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid , nx, ny) + (6+NSCALARS)*n_cells]; + face_z_neg = + fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny) + (6+NSCALARS)*n_cells]; + + // sum and average face centered electric fields and slopes to get the + // edge averaged electric field. 
+ ctElectricFields[threadId + 1*n_cells] = 0.25 * (+ face_x_pos + + face_x_neg + + face_z_pos + + face_z_neg + + slope_x_pos + + slope_x_neg + + slope_z_pos + + slope_z_neg); + + // ================ + // Z electric field + // ================ + + // Y-direction slope on the positive Y side + signUpwind = fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid, nx, ny)]; + if (signUpwind > 0.0) + { + slope_y_pos = mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, 0, -1, 0, 1, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_y_pos = mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, -1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_y_pos = 0.5 * (mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, 0, -1, 0, 1, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, -1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // Y-direction slope on the negative Y side + signUpwind = fluxX[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny)]; + if (signUpwind > 0.0) + { + slope_y_neg = mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, 0, 1, 0, 1, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_y_neg = mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, 1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_y_neg = 0.5 * (mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, 0, 1, 0, 1, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, 1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // X-direction slope on the positive X side + signUpwind = fluxY[cuda_utilities::compute1DIndex(xid, yid-1, zid, nx, ny)]; + if (signUpwind > 0.0) + { + slope_x_pos = mhd::_internal::_ctSlope(fluxX, dev_conserved, -1, 2, 1, -1, 0, 1, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_x_pos = mhd::_internal::_ctSlope(fluxX, dev_conserved, -1, 2, -1, -1, 0, -1, xid, yid, zid, nx, ny, 
n_cells); + } + else + { + slope_x_pos = 0.5 * (mhd::_internal::_ctSlope(fluxX, dev_conserved, -1, 2, 1, -1, 0, 1, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxX, dev_conserved, -1, 2, -1, -1, 0, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // X-direction slope on the negative X side + signUpwind = fluxY[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny)]; + if (signUpwind > 0.0) + { + slope_x_neg = mhd::_internal::_ctSlope(fluxX, dev_conserved, -1, 2, 0, 1, 0, 1, xid, yid, zid, nx, ny, n_cells); + } + else if (signUpwind < 0.0) + { + slope_x_neg = mhd::_internal::_ctSlope(fluxX, dev_conserved, -1, 2, 0, -1, 0, -1, xid, yid, zid, nx, ny, n_cells); + } + else + { + slope_x_neg = 0.5 * (mhd::_internal::_ctSlope(fluxX, dev_conserved, -1, 2, 0, 1, 0, 1, xid, yid, zid, nx, ny, n_cells) + + mhd::_internal::_ctSlope(fluxX, dev_conserved, -1, 2, 0, -1, 0, -1, xid, yid, zid, nx, ny, n_cells)); + } + + // Load the face centered electric fields Note the negative signs to + // convert from magnetic flux to electric field + face_x_pos = + fluxY[cuda_utilities::compute1DIndex(xid , yid-1, zid, nx, ny) + (6+NSCALARS)*n_cells]; + face_x_neg = + fluxY[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny) + (6+NSCALARS)*n_cells]; + face_y_pos = - fluxX[cuda_utilities::compute1DIndex(xid-1, yid , zid, nx, ny) + (5+NSCALARS)*n_cells]; + face_y_neg = - fluxX[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny) + (5+NSCALARS)*n_cells]; + + // sum and average face centered electric fields and slopes to get the + // edge averaged electric field. 
+ ctElectricFields[threadId + 2*n_cells] = 0.25 * (+ face_x_pos + + face_x_neg + + face_y_pos + + face_y_neg + + slope_x_pos + + slope_x_neg + + slope_y_pos + + slope_y_neg); + } + } + // ========================================================================= +} // end namespace mhd \ No newline at end of file diff --git a/src/mhd/ct_electric_fields.h b/src/mhd/ct_electric_fields.h new file mode 100644 index 000000000..987633461 --- /dev/null +++ b/src/mhd/ct_electric_fields.h @@ -0,0 +1,155 @@ +/*! + * \file ct_electric_fields.h + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Contains the declaration for the kernel that computes the CT electric fields + * + */ + +#pragma once + +// STL Includes + +// External Includes + +// Local Includes +#include "../global/global.h" +#include "../global/global_cuda.h" +#include "../utils/gpu.hpp" +#include "../utils/cuda_utilities.h" + +/*! + * \brief Namespace for MHD code + * + */ +namespace mhd +{ + /*! + * \brief Namespace for functions required by functions within the mhd + * namespace. Everything in this name space should be regarded as private + * but is made accesible for testing + * + */ + namespace _internal + { + // ===================================================================== + /*! + * \brief Compute and return the slope of the electric field used to + compute the CT electric fields + * + * \param[in] flux The flux array + * \param[in] dev_conserved The conserved variable array + * \param[in] fluxSign The sign of the flux to convert it to magnetic + * field. Also serves to choose which magnetic flux is used, i.e. the Y + * or Z field + * \param[in] ctDirection The direction of the CT field that this slope + will be used to calculate + * \param[in] conservedQuadrent1 Which index should be reduced by one to get the correct conserved variables. 
Options are -1 for no reduction, 0 for reducing xid, 1 for reducing yid, and 2 for reducing zid + * \param[in] conservedQuadrent2 Which index should be reduced by one to get the correct conserved variables. Options are -1 for no reduction, 0 for reducing xid, 1 for reducing yid, and 2 for reducing zid + * \param[in] fluxQuadrent1 Which index should be reduced by one to get the correct flux variable. Options are -1 for no reduction, 0 for reducing xid, 1 for reducing yid, and 2 for reducing zid + * \param[in] fluxQuadrent2 Which index should be reduced by one to get the correct flux variable. Options are -1 for no reduction, 0 for reducing xid, 1 for reducing yid, and 2 for reducing zid + * \param[in] xid The x index + * \param[in] yid The y index + * \param[in] zid The z index + * \param[in] nx The number of cells in the x-direction + * \param[in] ny The number of cells in the y-direction + * \param[in] n_cells The total number of cells + * \return Real The slope of the electric field + */ + inline __host__ __device__ Real _ctSlope(Real const *flux, + Real const *dev_conserved, + Real const &fluxSign, + int const &ctDirection, + int const &conservedQuadrent1, + int const &conservedQuadrent2, + int const &fluxQuadrent1, + int const &fluxQuadrent2, + int const &xid, + int const &yid, + int const &zid, + int const &nx, + int const &ny, + int const &n_cells + ) + { + // Compute the various required indices + + // Get the shifted modulos of the ctDirection. 
+ int const modPlus1 = (ctDirection + 1) % 3; + int const modPlus2 = (ctDirection + 2) % 3; + + // Indices for the cell centered values + int const xidCentered = xid - int(conservedQuadrent1 == 0) - int(conservedQuadrent2 == 0); + int const yidCentered = yid - int(conservedQuadrent1 == 1) - int(conservedQuadrent2 == 1); + int const zidCentered = zid - int(conservedQuadrent1 == 2) - int(conservedQuadrent2 == 2); + int const idxCentered = cuda_utilities::compute1DIndex(xidCentered, yidCentered, zidCentered, nx, ny); + + // Index for the flux + int const idxFlux = cuda_utilities::compute1DIndex(xid - int(fluxQuadrent1 == 0) - int(fluxQuadrent2 == 0), + yid - int(fluxQuadrent1 == 1) - int(fluxQuadrent2 == 1), + zid - int(fluxQuadrent1 == 2) - int(fluxQuadrent2 == 2), + nx, ny); + + // Indices for the face centered magnetic fields that need to be averaged + int const idxB2Shift = cuda_utilities::compute1DIndex(xidCentered - int(modPlus1 == 0), + yidCentered - int(modPlus1 == 1), + zidCentered - int(modPlus1 == 2), + nx, ny); + int const idxB3Shift = cuda_utilities::compute1DIndex(xidCentered - int(modPlus2 == 0), + yidCentered - int(modPlus2 == 1), + zidCentered - int(modPlus2 == 2), + nx, ny); + + // Load values for cell centered electric field. B1 (not present) is + // the magnetic field in the same direction as the `ctDirection` + // variable, B2 and B3 are the next two fields cyclically. i.e. if + // B1=Bx then B2=By and B3=Bz, if B1=By then B2=Bz and B3=Bx. 
The + // same rules apply for the momentum + Real const density = dev_conserved[idxCentered ]; + Real const Momentum2 = dev_conserved[idxCentered + (modPlus1+1) *n_cells]; + Real const Momentum3 = dev_conserved[idxCentered + (modPlus2+1) *n_cells]; + Real const B2Centered = 0.5 * ( dev_conserved[idxCentered + (modPlus1+5+NSCALARS)*n_cells] + + dev_conserved[idxB2Shift + (modPlus1+5+NSCALARS)*n_cells]); + Real const B3Centered = 0.5 * ( dev_conserved[idxCentered + (modPlus2+5+NSCALARS)*n_cells] + + dev_conserved[idxB3Shift + (modPlus2+5+NSCALARS)*n_cells]); + + // Compute the electric field in the center with a cross product + Real const electric_centered = (Momentum3*B2Centered - Momentum2*B3Centered) / density; + + // Load face centered electric field, note fluxSign to correctly do + // the shift from magnetic flux to EMF/electric field and to choose + // which field to use + Real const electric_face = fluxSign * flux[idxFlux + (int(fluxSign == 1)+5+NSCALARS)*n_cells]; + + // Compute the slope and return it + return electric_face - electric_centered; + } + // ===================================================================== + }// _mhd_internal namespace + + // ========================================================================= + /*! + * \brief Compute the Constrained Transport electric fields used to evolve + * the magnetic field. Note that this function requires that the density be + * non-zero or it will return Nans. 
+ * + * \param[in] fluxX The flux on the x+1/2 face of each cell + * \param[in] fluxY The flux on the y+1/2 face of each cell + * \param[in] fluxZ The flux on the z+1/2 face of each cell + * \param[in] dev_conserved The device resident grid + * \param[out] ctElectricFields The CT electric fields + * \param[in] nx The number of cells in the x-direction + * \param[in] ny The number of cells in the y-direction + * \param[in] nz The number of cells in the z-direction + * \param[in] n_cells The total number of cells + */ + __global__ void Calculate_CT_Electric_Fields(Real const *fluxX, + Real const *fluxY, + Real const *fluxZ, + Real const *dev_conserved, + Real *ctElectricFields, + int const nx, + int const ny, + int const nz, + int const n_cells); + // ========================================================================= +} // end namespace mhd \ No newline at end of file diff --git a/src/mhd/ct_electric_fields_tests.cu b/src/mhd/ct_electric_fields_tests.cu new file mode 100644 index 000000000..55b46f3c8 --- /dev/null +++ b/src/mhd/ct_electric_fields_tests.cu @@ -0,0 +1,207 @@ +/*! + * \file ct_electric_fields_tests.cu + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Tests for the CT electric fields + * + */ + +// STL Includes +#include +#include +#include +#include +#include + +// External Includes +#include // Include GoogleTest and related libraries/headers + +// Local Includes +#include "../utils/testing_utilities.h" +#include "../mhd/ct_electric_fields.h" +#include "../global/global.h" + +// ============================================================================= +// Tests for the mhd::Calculate_CT_Electric_Fields kernel +// ============================================================================= + +// ============================================================================= +/*! + * \brief Test fixture for tMHDCalculateCTElectricFields test suite + * + */ +class tMHDCalculateCTElectricFields : public ::testing::Test +{ +public: + + /*! 
+ * \brief Initialize and allocate all the various required variables and + * arrays + * + */ + tMHDCalculateCTElectricFields() + : + nx(3), + ny(nx), + nz(nx), + n_cells(nx*ny*nz), + fluxX(n_cells * (7+NSCALARS)), + fluxY(n_cells * (7+NSCALARS)), + fluxZ(n_cells * (7+NSCALARS)), + grid (n_cells * (8+NSCALARS)), + testCTElectricFields(n_cells * 3, -999.), + fiducialData(n_cells * 3, -999.), + dimGrid((n_cells + TPB - 1),1,1), + dimBlock(TPB,1,1) + { + // Allocate device arrays + CudaSafeCall ( cudaMalloc(&dev_fluxX, fluxX.size()*sizeof(double)) ); + CudaSafeCall ( cudaMalloc(&dev_fluxY, fluxY.size()*sizeof(double)) ); + CudaSafeCall ( cudaMalloc(&dev_fluxZ, fluxZ.size()*sizeof(double)) ); + CudaSafeCall ( cudaMalloc(&dev_grid, grid.size()*sizeof(double)) ); + CudaSafeCall ( cudaMalloc(&dev_testCTElectricFields, testCTElectricFields.size()*sizeof(double)) ); + + // Populate the grids with values where vector.at(i) = double(i). The + // values chosen aren't that important, just that every cell has a unique + // value + std::iota(std::begin(fluxX), std::end(fluxX), 0.); + std::iota(std::begin(fluxY), std::end(fluxY), fluxX.back() + 1); + std::iota(std::begin(fluxZ), std::end(fluxZ), fluxY.back() + 1); + std::iota(std::begin(grid), std::end(grid), fluxZ.back() + 1); + } + ~tMHDCalculateCTElectricFields() = default; +protected: + // Initialize the test grid and other state variables + size_t const nx, ny, nz; + size_t const n_cells; + + // Launch Parameters + dim3 const dimGrid; // How many blocks in the grid + dim3 const dimBlock; // How many threads per block + + // Make sure the vector is large enough that the locations where the + // magnetic field would be in the real grid are filled + std::vector fluxX; + std::vector fluxY; + std::vector fluxZ; + std::vector grid; + std::vector testCTElectricFields; + std::vector fiducialData; + + // device pointers + double *dev_fluxX, *dev_fluxY, *dev_fluxZ, *dev_grid, *dev_testCTElectricFields; + + /*! 
+ * \brief Launch the kernel and check results + * + */ + void runTest() + { + // Copy values to GPU + CudaSafeCall( cudaMemcpy(dev_fluxX, fluxX.data(), fluxX.size()*sizeof(Real), cudaMemcpyHostToDevice) ); + CudaSafeCall( cudaMemcpy(dev_fluxY, fluxY.data(), fluxY.size()*sizeof(Real), cudaMemcpyHostToDevice) ); + CudaSafeCall( cudaMemcpy(dev_fluxZ, fluxZ.data(), fluxZ.size()*sizeof(Real), cudaMemcpyHostToDevice) ); + CudaSafeCall( cudaMemcpy(dev_grid, grid.data(), grid.size()*sizeof(Real), cudaMemcpyHostToDevice) ); + CudaSafeCall( cudaMemcpy(dev_testCTElectricFields, + testCTElectricFields.data(), + testCTElectricFields.size()*sizeof(Real), + cudaMemcpyHostToDevice) ); + + // Call the kernel to test + hipLaunchKernelGGL(mhd::Calculate_CT_Electric_Fields, + dimGrid, + dimBlock, + 0, + 0, + dev_fluxX, + dev_fluxY, + dev_fluxZ, + dev_grid, + dev_testCTElectricFields, + nx, + ny, + nz, + n_cells); + CudaCheckError(); + + // Copy test data back + CudaSafeCall( cudaMemcpy(testCTElectricFields.data(), + dev_testCTElectricFields, + testCTElectricFields.size()*sizeof(Real), + cudaMemcpyDeviceToHost) ); + cudaDeviceSynchronize(); + + // Check the results + for (size_t i = 0; i < fiducialData.size(); i++) + { + int xid, yid, zid; + cuda_utilities::compute3DIndices(i, nx, ny, xid, yid, zid); + testingUtilities::checkResults(fiducialData.at(i), + testCTElectricFields.at(i), + "value at i = " + std::to_string(i) + + ", xid = " + std::to_string(xid) + + ", yid = " + std::to_string(yid) + + ", zid = " + std::to_string(zid)); + } + } +}; +// ============================================================================= + +// ============================================================================= +TEST_F(tMHDCalculateCTElectricFields, + PositiveVelocityExpectCorrectOutput) +{ + // Fiducial values + fiducialData.at(26) = 206.29859653255295; + fiducialData.at(53) = -334.90052254763339; + fiducialData.at(80) = 209.53472440298236; + + // Launch kernel and check results + 
runTest(); +} +// ============================================================================= + +// ============================================================================= +TEST_F(tMHDCalculateCTElectricFields, + NegativeVelocityExpectCorrectOutput) +{ + // Fiducial values + fiducialData.at(26) = 203.35149422304994; + fiducialData.at(53) = -330.9860399765279; + fiducialData.at(80) = 208.55149905461991; + + // Set the density fluxes to be negative to indicate a negative velocity + // across the face + for (size_t i = 0; i < n_cells; i++) + { + fluxX.at(i) = -fluxX.at(i); + fluxY.at(i) = -fluxY.at(i); + fluxZ.at(i) = -fluxZ.at(i); + } + + // Launch kernel and check results + runTest(); +} +// ============================================================================= + +// ============================================================================= +TEST_F(tMHDCalculateCTElectricFields, + ZeroVelocityExpectCorrectOutput) +{ + // Fiducial values + fiducialData.at(26) = 204.82504537780144; + fiducialData.at(53) = -332.94328126208063; + fiducialData.at(80) = 209.04311172880114; + + // Set the density fluxes to zero to indicate no velocity + // across the face + for (size_t i = 0; i < n_cells; i++) + { + fluxX.at(i) = 0.0; + fluxY.at(i) = 0.0; + fluxZ.at(i) = 0.0; + } + + // Launch kernel and check results + runTest(); +} +// ============================================================================= diff --git a/src/mhd/magnetic_divergence.cu b/src/mhd/magnetic_divergence.cu new file mode 100644 index 000000000..02051e48c --- /dev/null +++ b/src/mhd/magnetic_divergence.cu @@ -0,0 +1,112 @@ +/*! + * \file magnetic_divergence.cu + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Contains the implementation of the functions that compute the + * maximum divergence of the magnetic field for the 3D VL+CT MHD + * integrator.
Due to the CUDA/HIP compiler requiring that device functions be + * directly accessible to the file they're used in most device functions will be + * implemented in the header file + * + */ + +// STL Includes +#include +#include + +// External Includes + +// Local Includes +#include "../mhd/magnetic_divergence.h" +#include "../utils/cuda_utilities.h" +#include "../utils/reduction_utilities.h" +#include "../utils/DeviceVector.h" + +namespace mhd +{ + // ========================================================================= + __global__ void calculateMagneticDivergence(Real const *dev_conserved, + Real *dev_maxDivergence, + Real const dx, + Real const dy, + Real const dz, + int const nx, + int const ny, + int const nz, + int const n_cells) + { + // Variables to store the divergence + Real cellDivergence; + Real maxDivergence = 0.0; + + // Index variables + int xid, yid, zid, id_xMin1, id_yMin1, id_zMin1; + + // Grid stride loop to perform as much of the reduction as possible + for(size_t id = threadIdx.x + blockIdx.x * blockDim.x; id < n_cells; id += blockDim.x * gridDim.x) + { + // compute the real indices + cuda_utilities::compute3DIndices(id, nx, ny, xid, yid, zid); + + // Thread guard to avoid overrun and to skip ghost cells that cannot + // have their divergences computed due to a missing face; + if ( xid > 1 and yid > 1 and zid > 1 + and xid < nx and yid < ny and zid < nz) + { + // Compute the various offset indices + id_xMin1 = cuda_utilities::compute1DIndex(xid-1, yid , zid , nx, ny); + id_yMin1 = cuda_utilities::compute1DIndex(xid , yid-1, zid , nx, ny); + id_zMin1 = cuda_utilities::compute1DIndex(xid , yid , zid-1, nx, ny); + + // Compute divergence + cellDivergence = + (( dev_conserved[id + (5+NSCALARS)*n_cells] + - dev_conserved[id_xMin1 + (5+NSCALARS)*n_cells]) + / dx) + + (( dev_conserved[id + (6+NSCALARS)*n_cells] + - dev_conserved[id_yMin1 + (6+NSCALARS)*n_cells]) + / dy) + + (( dev_conserved[id + (7+NSCALARS)*n_cells] + - dev_conserved[id_zMin1 + 
(7+NSCALARS)*n_cells]) + / dz); + + maxDivergence = max(maxDivergence, fabs(cellDivergence)); + } + } + + // Perform reduction across the entire grid + reduction_utilities::gridReduceMax(maxDivergence, dev_maxDivergence); + } + // ========================================================================= + + // ========================================================================= + Real launchCalculateMagneticDivergence(Real const *dev_conserved, + Real const dx, + Real const dy, + Real const dz, + int const nx, + int const ny, + int const nz, + int const n_cells) + { + // First let's create some variables we'll need. + cuda_utilities::AutomaticLaunchParams static const launchParams(mhd::calculateMagneticDivergence); + cuda_utilities::DeviceVector static dev_maxDivergence(1); + + // Set the device side maximum divergence to the smallest possible double + // so that the reduction isn't using the maximum value of the previous + // iteration + dev_maxDivergence.assign(std::numeric_limits::lowest()); + + // Now lets get the local maximum divergence + hipLaunchKernelGGL(mhd::calculateMagneticDivergence, + launchParams.numBlocks, launchParams.threadsPerBlock, 0, 0, + dev_conserved, dev_maxDivergence.data(), + dx, dy, dz, + nx, ny, nz, + n_cells); + CudaCheckError(); + + return dev_maxDivergence[0]; + } + // ========================================================================= +} // end namespace mhd \ No newline at end of file diff --git a/src/mhd/magnetic_divergence.h b/src/mhd/magnetic_divergence.h new file mode 100644 index 000000000..8550591e2 --- /dev/null +++ b/src/mhd/magnetic_divergence.h @@ -0,0 +1,81 @@ +/*!
+ * \file magnetic_divergence.h + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Contains the declaration for the functions that compute the magnetic + * divergence + * + */ + +#pragma once + +// STL Includes + +// External Includes + +// Local Includes +#include "../global/global.h" +#include "../global/global_cuda.h" +#include "../utils/gpu.hpp" + + +/*! + * \brief Namespace for MHD code + * + */ +namespace mhd +{ + // ========================================================================= + /*! + * \brief Kernel to compute the maximum divergence of the magnetic field in + * the grid. Uses `reduction_utilities::gridReduceMax` and as such should be + * called with the minimum number of blocks. Recommend using the occupancy + * API + * + * \param[in] dev_conserved The device array of conserved variables + * \param[out] maxDivergence The device scalar to store the reduced divergence at + * \param[in] dx Cell size in the X-direction + * \param[in] dy Cell size in the Y-direction + * \param[in] dz Cell size in the Z-direction + * \param[in] nx Number of cells in the X-direction + * \param[in] ny Number of cells in the Y-direction + * \param[in] nz Number of cells in the Z-direction + * \param[in] n_cells Total number of cells + */ + __global__ void calculateMagneticDivergence(Real const *dev_conserved, + Real *maxDivergence, + Real const dx, + Real const dy, + Real const dz, + int const nx, + int const ny, + int const nz, + int const n_cells); + // ========================================================================= + + // ========================================================================= + /*! 
+ * \brief Handles launching and returning the value from the + * `mhd::calculateMagneticDivergence` kernel + * + * \param[in] dev_conserved The device array of conserved variables + * \param[in] dx Cell size in the X-direction + * \param[in] dy Cell size in the Y-direction + * \param[in] dz Cell size in the Z-direction + * \param[in] nx Number of cells in the X-direction + * \param[in] ny Number of cells in the Y-direction + * \param[in] nz Number of cells in the Z-direction + * \param[in] n_cells Total number of cells + * \return Real The maximum divergence of the magnetic field in the local + * part of the grid + */ + Real launchCalculateMagneticDivergence(Real const *dev_conserved, + Real const dx, + Real const dy, + Real const dz, + int const nx, + int const ny, + int const nz, + int const n_cells); + // ========================================================================= + +} // end namespace mhd \ No newline at end of file diff --git a/src/mhd/magnetic_divergence_tests.cu b/src/mhd/magnetic_divergence_tests.cu new file mode 100644 index 000000000..ba2695e53 --- /dev/null +++ b/src/mhd/magnetic_divergence_tests.cu @@ -0,0 +1,59 @@ +/*!
+ * \file magnetic_divergence_tests.cu + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Tests for the magnetic divergence code + * + */ + + +// STL Includes +#include +#include +#include +#include + +// External Includes +#include // Include GoogleTest and related libraries/headers + +// Local Includes +#include "../utils/testing_utilities.h" +#include "../mhd/magnetic_divergence.h" +#include "../utils/DeviceVector.h" +#include "../global/global.h" + +// ============================================================================= +// Tests for the magnetic field divergence functions +// ============================================================================= +TEST(tMHDLaunchCalculateMagneticDivergence, CorrectInputExpectCorrectOutput) +{ + // Grid Parameters & testing parameters + size_t const gridSize = 96; // Needs to be at least 64 so that each thread has a value + size_t const n_ghost = 4; + size_t const nx = gridSize+2*n_ghost, ny = nx, nz = nx; + size_t const n_cells = nx*ny*nz; + size_t const n_fields = 8; + Real const dx = 3, dy = dx, dz = dx; + std::vector host_grid(n_cells*n_fields); + + // Fill grid with random values and randomly assign maximum value + std::mt19937 prng(1); + std::uniform_real_distribution doubleRand(1, 5); + for (size_t i = 0; i < host_grid.size(); i++) + { + host_grid.at(i) = doubleRand(prng); + } + + // Allocating and copying to device + cuda_utilities::DeviceVector dev_grid(host_grid.size()); + dev_grid.cpyHostToDevice(host_grid); + + // Get test data + Real testDivergence = mhd::launchCalculateMagneticDivergence(dev_grid.data(), dx, dy, dz, nx, ny, nz, n_cells); + + // Perform Comparison + Real const fiducialDivergence = 3.6318132783263106; + testingUtilities::checkResults(fiducialDivergence, testDivergence, "maximum divergence"); +} +// ============================================================================= +// End of tests for the magnetic field divergence functions +// 
============================================================================= diff --git a/src/mhd/magnetic_update.cu b/src/mhd/magnetic_update.cu new file mode 100644 index 000000000..78f298e05 --- /dev/null +++ b/src/mhd/magnetic_update.cu @@ -0,0 +1,80 @@ +/*! + * \file magnetic_update.cu + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Contains the definition of the kernel to update the magnetic field + * + */ + +// STL Includes + +// External Includes + +// Local Includes +#include "../mhd/magnetic_update.h" +#include "../utils/cuda_utilities.h" + +namespace mhd +{ + // ========================================================================= + __global__ void Update_Magnetic_Field_3D(Real *sourceGrid, + Real *destinationGrid, + Real *ctElectricFields, + int const nx, + int const ny, + int const nz, + int const n_cells, + Real const dt, + Real const dx, + Real const dy, + Real const dz) + { + // get a thread index + int const blockId = blockIdx.x + blockIdx.y*gridDim.x; + int const threadId = threadIdx.x + blockId * blockDim.x; + int xid, yid, zid; + cuda_utilities::compute3DIndices(threadId, nx, ny, xid, yid, zid); + + // Thread guard to avoid overrun and to skip ghost cells that cannot be + // evolved due to missing electric fields that can't be reconstructed + if ( xid < nx-1 + and yid < ny-1 + and zid < nz-1) + { + // Compute the three dt/dx quantities + Real const dtodx = dt/dx; + Real const dtody = dt/dy; + Real const dtodz = dt/dz; + + // Load the various edge electric fields required. 
The '1' and '2' + // fields are not shared and the '3' fields are shared by two of the + // updates + Real electric_x_1 = ctElectricFields[(cuda_utilities::compute1DIndex(xid , yid+1, zid , nx, ny))]; + Real electric_x_2 = ctElectricFields[(cuda_utilities::compute1DIndex(xid , yid , zid+1, nx, ny))]; + Real electric_x_3 = ctElectricFields[(cuda_utilities::compute1DIndex(xid , yid+1, zid+1, nx, ny))]; + Real electric_y_1 = ctElectricFields[(cuda_utilities::compute1DIndex(xid+1, yid , zid , nx, ny)) + n_cells]; + Real electric_y_2 = ctElectricFields[(cuda_utilities::compute1DIndex(xid , yid , zid+1, nx, ny)) + n_cells]; + Real electric_y_3 = ctElectricFields[(cuda_utilities::compute1DIndex(xid+1, yid , zid+1, nx, ny)) + n_cells]; + Real electric_z_1 = ctElectricFields[(cuda_utilities::compute1DIndex(xid+1, yid , zid , nx, ny)) + 2 * n_cells]; + Real electric_z_2 = ctElectricFields[(cuda_utilities::compute1DIndex(xid , yid+1, zid , nx, ny)) + 2 * n_cells]; + Real electric_z_3 = ctElectricFields[(cuda_utilities::compute1DIndex(xid+1, yid+1, zid , nx, ny)) + 2 * n_cells]; + + // Perform Updates + + // X field update + destinationGrid[threadId + (5+NSCALARS)*n_cells] = sourceGrid[threadId + (5+NSCALARS)*n_cells] + + dtodz * (electric_y_3 - electric_y_1) + + dtody * (electric_z_1 - electric_z_3); + + // Y field update + destinationGrid[threadId + (6+NSCALARS)*n_cells] = sourceGrid[threadId + (6+NSCALARS)*n_cells] + + dtodx * (electric_z_3 - electric_z_2) + + dtodz * (electric_x_1 - electric_x_3); + + // Z field update + destinationGrid[threadId + (7+NSCALARS)*n_cells] = sourceGrid[threadId + (7+NSCALARS)*n_cells] + + dtody * (electric_x_3 - electric_x_2) + + dtodx * (electric_y_2 - electric_y_3); + } + } + // ========================================================================= +} // end namespace mhd \ No newline at end of file diff --git a/src/mhd/magnetic_update.h b/src/mhd/magnetic_update.h new file mode 100644 index 000000000..2c89e26ba --- /dev/null +++ 
b/src/mhd/magnetic_update.h @@ -0,0 +1,57 @@ +/*! + * \file magnetic_update.h + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Contains the declaration of the kernel to update the magnetic field + * + */ + +#pragma once + +// STL Includes + +// External Includes + +// Local Includes +#include "../global/global.h" +#include "../global/global_cuda.h" +#include "../utils/gpu.hpp" + +/*! + * \brief Namespace for MHD code + * + */ +namespace mhd +{ + // ========================================================================= + /*! + * \brief Update the magnetic field using the CT electric fields + * + * \param[in] sourceGrid The array which holds the old values of the + * magnetic field + * \param[out] destinationGrid The array to hold the updated values of the + * magnetic field + * \param[in] ctElectricFields The array of constrained transport electric + * fields + * \param[in] nx The number of cells in the x-direction + * \param[in] ny The number of cells in the y-direction + * \param[in] nz The number of cells in the z-direction + * \param[in] n_cells The total number of cells + * \param[in] dt The time step. 
If doing the half time step update make sure + * to divide it by two when passing the time step to this kernel + * \param[in] dx The size of each cell in the x-direction + * \param[in] dy The size of each cell in the y-direction + * \param[in] dz The size of each cell in the z-direction + */ + __global__ void Update_Magnetic_Field_3D(Real *sourceGrid, + Real *destinationGrid, + Real *ctElectricFields, + int const nx, + int const ny, + int const nz, + int const n_cells, + Real const dt, + Real const dx, + Real const dy, + Real const dz); + // ========================================================================= +} // end namespace mhd \ No newline at end of file diff --git a/src/mhd/magnetic_update_tests.cu b/src/mhd/magnetic_update_tests.cu new file mode 100644 index 000000000..7cb4f68f2 --- /dev/null +++ b/src/mhd/magnetic_update_tests.cu @@ -0,0 +1,150 @@ +/*! + * \file magnetic_update_tests.cu + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Tests for the magnetic update code + * + */ + +// STL Includes +#include +#include +#include +#include + +// External Includes +#include // Include GoogleTest and related libraries/headers + +// Local Includes +#include "../utils/testing_utilities.h" +#include "../utils/cuda_utilities.h" +#include "../mhd/magnetic_update.h" + +// ============================================================================= +/*! + * \brief Test fixture for tMHDUpdateMagneticField3D test suite + * + */ +class tMHDUpdateMagneticField3D : public ::testing::Test +{ +public: + + /*! 
+ * \brief Initialize and allocate all the various required variables and + * arrays + * + */ + tMHDUpdateMagneticField3D() + : + nx(2), + ny(nx), + nz(nx), + n_cells(nx*ny*nz), + dt(3.2), + dx(2.5), + dy(2.5), + dz(2.5), + sourceGrid (n_cells * (8+NSCALARS)), + destinationGrid (n_cells * (8+NSCALARS), -999.), + ctElectricFields(n_cells * 3), + fiducialData (n_cells * (8+NSCALARS), -999.), + dimGrid((n_cells + TPB - 1),1,1), + dimBlock(TPB,1,1) + { + // Allocate device arrays + CudaSafeCall ( cudaMalloc(&dev_sourceGrid, sourceGrid.size()*sizeof(double)) ); + CudaSafeCall ( cudaMalloc(&dev_destinationGrid, destinationGrid.size()*sizeof(double)) ); + CudaSafeCall ( cudaMalloc(&dev_ctElectricFields, ctElectricFields.size()*sizeof(double)) ); + + // Populate the grids with values where vector.at(i) = double(i). The + // values chosen aren't that important, just that every cell has a unique + // value + std::iota(std::begin(sourceGrid), std::end(sourceGrid), 0.); + std::iota(std::begin(ctElectricFields), std::end(ctElectricFields), sourceGrid.back() + 1); + } + ~tMHDUpdateMagneticField3D() = default; +protected: + // Initialize the test grid and other state variables + size_t const nx, ny, nz; + size_t const n_cells; + Real const dt, dx, dy, dz; + + // Launch Parameters + dim3 const dimGrid; // How many blocks in the grid + dim3 const dimBlock; // How many threads per block + + // Make sure the vector is large enough that the locations where the + // magnetic field would be in the real grid are filled + std::vector sourceGrid; + std::vector destinationGrid; + std::vector ctElectricFields; + std::vector fiducialData; + + // device pointers + double *dev_sourceGrid, *dev_destinationGrid, *dev_ctElectricFields, *dev_fiducialData; + + /*! 
+ * \brief Launch the kernel and check results + * + */ + void runTest() + { + // Copy values to GPU + CudaSafeCall( cudaMemcpy(dev_sourceGrid, sourceGrid.data(), sourceGrid.size()*sizeof(Real), cudaMemcpyHostToDevice) ); + CudaSafeCall( cudaMemcpy(dev_destinationGrid, destinationGrid.data(), destinationGrid.size()*sizeof(Real), cudaMemcpyHostToDevice) ); + CudaSafeCall( cudaMemcpy(dev_ctElectricFields, ctElectricFields.data(), ctElectricFields.size()*sizeof(Real), cudaMemcpyHostToDevice) ); + + // Call the kernel to test + hipLaunchKernelGGL(mhd::Update_Magnetic_Field_3D, + dimGrid, + dimBlock, + 0, + 0, + dev_sourceGrid, + dev_destinationGrid, + dev_ctElectricFields, + nx, + ny, + nz, + n_cells, + dt, + dx, + dy, + dz); + CudaCheckError(); + + // Copy test data back + CudaSafeCall( cudaMemcpy(destinationGrid.data(), + dev_destinationGrid, + destinationGrid.size()*sizeof(Real), + cudaMemcpyDeviceToHost) ); + cudaDeviceSynchronize(); + + // Check the results + for (size_t i = 0; i < fiducialData.size(); i++) + { + int xid, yid, zid; + cuda_utilities::compute3DIndices(i, nx, ny, xid, yid, zid); + testingUtilities::checkResults(fiducialData.at(i), + destinationGrid.at(i), + "value at i = " + std::to_string(i) + + ", xid = " + std::to_string(xid) + + ", yid = " + std::to_string(yid) + + ", zid = " + std::to_string(zid)); + } + } +}; +// ============================================================================= + +// ============================================================================= +TEST_F(tMHDUpdateMagneticField3D, + CorrectInputExpectCorrectOutput) +{ + // Fiducial values + fiducialData.at(40) = 42.559999999999995; + fiducialData.at(48) = 44.160000000000004; + fiducialData.at(56) = 57.280000000000001; + + // Launch kernel and check results + runTest(); +} +// ============================================================================= diff --git a/src/reconstruction/pcm_cuda.cu b/src/reconstruction/pcm_cuda.cu index 1964ddedf..91fb75223 100644 --- 
a/src/reconstruction/pcm_cuda.cu +++ b/src/reconstruction/pcm_cuda.cu @@ -7,7 +7,8 @@ #include "../global/global.h" #include "../global/global_cuda.h" #include "../reconstruction/pcm_cuda.h" - +#include "../utils/mhd_utilities.h" +#include "../utils/cuda_utilities.h" __global__ void PCM_Reconstruction_1D(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bounds_R, int n_cells, int n_ghost, Real gamma, int n_fields) { @@ -18,11 +19,11 @@ __global__ void PCM_Reconstruction_1D(Real *dev_conserved, Real *dev_bounds_L, R #ifdef DE Real ge; - #endif + #endif //DE #ifdef SCALAR Real scalar[NSCALARS]; - #endif + #endif //SCALAR // get a global thread ID int xid = threadIdx.x + blockIdx.x*blockDim.x; @@ -43,10 +44,10 @@ __global__ void PCM_Reconstruction_1D(Real *dev_conserved, Real *dev_bounds_L, R for (int i=0; i 0) + { + id = cuda_utilities::compute1DIndex(xid-1, yid, zid, nx, ny); + dev_bounds_Rx[ id] = d; + dev_bounds_Rx[ n_cells + id] = mx; + dev_bounds_Rx[2*n_cells + id] = my; + dev_bounds_Rx[3*n_cells + id] = mz; + dev_bounds_Rx[4*n_cells + id] = E; + #ifdef SCALAR + for (int i=0; i 0) + { + // Send the y-1/2 Right interface + id = cuda_utilities::compute1DIndex(xid, yid-1, zid, nx, ny); + dev_bounds_Ry[ id] = d; + dev_bounds_Ry[ n_cells + id] = mx; + dev_bounds_Ry[2*n_cells + id] = my; + dev_bounds_Ry[3*n_cells + id] = mz; + dev_bounds_Ry[4*n_cells + id] = E; + #ifdef SCALAR + for (int i=0; i 0) + { + // Send the z-1/2 Right interface + id = cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny); + dev_bounds_Rz[ id] = d; + dev_bounds_Rz[ n_cells + id] = mx; + dev_bounds_Rz[2*n_cells + id] = my; + dev_bounds_Rz[3*n_cells + id] = mz; + dev_bounds_Rz[4*n_cells + id] = E; + #ifdef SCALAR + for (int i=0; i 0.0) { del_ge_G = 2.0*del_ge_L*del_ge_R / (del_ge_L+del_ge_R); } else { del_ge_G = 0.0; } - #endif + #endif //DE #ifdef SCALAR for (int i=0; i 0.0) { del_scalar_G[i] = 2.0*del_scalar_L[i]*del_scalar_R[i] / (del_scalar_L[i]+del_scalar_R[i]); } else { del_scalar_G[i] 
= 0.0; } } - #endif + #endif //SCALAR // Project the left, right, centered and van Leer differences onto the characteristic variables @@ -316,7 +316,7 @@ __global__ void PLMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou lim_slope_b = fmin(fabs(del_ge_C), fabs(del_ge_G)); del_ge_m_i = sgn_CUDA(del_ge_C) * fmin(2.0*lim_slope_a, lim_slope_b); } - #endif + #endif //DE #ifdef SCALAR for (int i=0; i= 0) { lamdiff = lambda_p - lambda_m; @@ -498,12 +498,12 @@ __global__ void PLMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou sum_3 += lamdiff * del_vz_m_i; #ifdef DE sum_ge += lamdiff * del_ge_m_i; - #endif + #endif //DE #ifdef SCALAR for (int i=0; i= 0) { @@ -522,24 +522,24 @@ __global__ void PLMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou p_L_iph += 0.5*dtodx*sum_4; #ifdef DE ge_L_iph += 0.5*dtodx*sum_ge; - #endif + #endif //DE #ifdef SCALAR for (int i=0; i 0.0) { del_ge_G = 2.0*del_ge_L*del_ge_R / (del_ge_L+del_ge_R); } else { del_ge_G = 0.0; } - #endif + #endif //DE #ifdef SCALAR for (int i=0; i 0.0) { del_scalar_G[i] = 2.0*del_scalar_L[i]*del_scalar_R[i] / (del_scalar_L[i]+del_scalar_R[i]); } else { del_scalar_G[i] = 0.0; } } - #endif + #endif //SCALAR // Step 3 - Project the left, right, centered and van Leer differences onto the characteristic variables @@ -372,7 +372,7 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou del_ge_m_imo = sgn_CUDA(del_ge_C) * fmin((Real) 2.0*lim_slope_a, lim_slope_b); } else del_ge_m_imo = 0.0; - #endif + #endif //DE #ifdef SCALAR for (int i=0; i 0.0) { @@ -382,7 +382,7 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou } else del_scalar_m_imo[i] = 0.0; } - #endif + #endif //SCALAR // Step 5 - Project the monotonized difference in the characteristic variables back onto the @@ -442,7 +442,7 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou del_ge_C = 0.5*(ge_ipo - ge_imo); if (del_ge_L*del_ge_R > 
0.0) { del_ge_G = 2.0*del_ge_L*del_ge_R / (del_ge_L+del_ge_R); } else { del_ge_G = 0.0; } - #endif + #endif //DE #ifdef SCALAR for (int i=0; i 0.0) { del_scalar_G[i] = 2.0*del_scalar_L[i]*del_scalar_R[i] / (del_scalar_L[i]+del_scalar_R[i]); } else { del_scalar_G[i] = 0.0; } } - #endif + #endif //SCALAR // Step 3 - Project the left, right, centered, and van Leer differences onto the characteristic variables // Stone Eqn 37 (del_a are differences in characteristic variables, see Stone for notation) @@ -520,7 +520,7 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou del_ge_m_i = sgn_CUDA(del_ge_C) * fmin((Real) 2.0*lim_slope_a, lim_slope_b); } else del_ge_m_i = 0.0; - #endif + #endif //DE #ifdef SCALAR for (int i=0; i 0.0) { @@ -530,7 +530,7 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou } else del_scalar_m_i[i] = 0.0; } - #endif + #endif //SCALAR // Step 5 - Project the monotonized difference in the characteristic variables back onto the @@ -591,7 +591,7 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou del_ge_C = 0.5*(ge_ipt- ge_i); if (del_ge_L*del_ge_R > 0.0) { del_ge_G = 2.0*del_ge_L*del_ge_R / (del_ge_L+del_ge_R); } else { del_ge_G = 0.0; } - #endif + #endif //DE #ifdef SCALAR for (int i=0; i 0.0) { del_scalar_G[i] = 2.0*del_scalar_L[i]*del_scalar_R[i] / (del_scalar_L[i]+del_scalar_R[i]); } else { del_scalar_G[i] = 0.0; } } - #endif + #endif //SCALAR // Step 3 - Project the left, right, centered, and van Leer differences onto the characteristic variables @@ -670,7 +670,7 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou del_ge_m_ipo = sgn_CUDA(del_ge_C) * fmin((Real) 2.0*lim_slope_a, lim_slope_b); } else del_ge_m_ipo = 0.0; - #endif + #endif //DE #ifdef SCALAR for (int i=0; i 0.0) { @@ -680,7 +680,7 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou } else del_scalar_m_ipo[i] = 0.0; } - #endif 
+ #endif //SCALAR // Step 5 - Project the monotonized difference in the characteristic variables back onto the @@ -713,13 +713,13 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou #ifdef DE ge_L = 0.5*(ge_i + ge_imo) - (del_ge_m_i - del_ge_m_imo) / 6.0; ge_R = 0.5*(ge_ipo + ge_i) - (del_ge_m_ipo - del_ge_m_i) / 6.0; - #endif + #endif //DE #ifdef SCALAR for (int i=0; i= 0) { @@ -909,24 +909,24 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou chi_5 = A*(del_p_m_i - p_6) + B*p_6; #ifdef DE chi_ge = A*(del_ge_m_i - ge_6) + B*ge_6; - #endif + #endif //DE #ifdef SCALAR for (int i=0; i= 0) { @@ -952,12 +952,12 @@ __global__ void PPMC_cuda(Real *dev_conserved, Real *dev_bounds_L, Real *dev_bou p_R += sum_5; #ifdef DE ge_R += sum_ge; - #endif + #endif //DE #ifdef SCALAR for (int i=0; i= 0.0) { - _hlldInternal::_returnFluxes(threadId, o1, o2, o3, n_cells, + mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, dev_flux, densityFluxL, momentumFluxXL, momentumFluxYL, momentumFluxZL, @@ -263,13 +264,13 @@ // Right state Real densityFluxR, momentumFluxXR, momentumFluxYR, momentumFluxZR, magneticFluxYR, magneticFluxZR, energyFluxR; - _hlldInternal::_nonStarFluxes(momentumXR, + mhd::_internal::_nonStarFluxes(momentumXR, velocityXR, velocityYR, velocityZR, totalPressureR, energyR, - magneticXR, + magneticX, magneticYR, magneticZR, densityFluxR, @@ -284,7 +285,7 @@ // In this state the flow is supersonic if (speedR <= 0.0) { - _hlldInternal::_returnFluxes(threadId, o1, o2, o3, n_cells, + mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, dev_flux, densityFluxR, momentumFluxXR, momentumFluxYR, momentumFluxZR, @@ -317,7 +318,7 @@ densityStarFluxL, momentumStarFluxXL, momentumStarFluxYL, momentumStarFluxZL, magneticStarFluxYL, magneticStarFluxZL, energyStarFluxL; - _hlldInternal::_starFluxes(speedM, + mhd::_internal::_starFluxes(speedM, speedL, densityL, velocityXL, @@ -328,7 +329,7 @@ momentumZL, 
energyL, totalPressureL, - magneticXL, + magneticX, magneticYL, magneticZL, densityStarL, @@ -357,7 +358,7 @@ // In this state the flow is subsonic if (speedStarL >= 0.0) { - _hlldInternal::_returnFluxes(threadId, o1, o2, o3, n_cells, + mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, dev_flux, densityStarFluxL, momentumStarFluxXL, momentumStarFluxYL, momentumStarFluxZL, @@ -381,7 +382,7 @@ densityStarFluxR, momentumStarFluxXR, momentumStarFluxYR, momentumStarFluxZR, magneticStarFluxYR, magneticStarFluxZR, energyStarFluxR; - _hlldInternal::_starFluxes(speedM, + mhd::_internal::_starFluxes(speedM, speedR, densityR, velocityXR, @@ -392,7 +393,7 @@ momentumZR, energyR, totalPressureR, - magneticXR, + magneticX, magneticYR, magneticZR, densityStarR, @@ -421,7 +422,7 @@ // In this state the flow is subsonic if (speedStarR <= 0.0) { - _hlldInternal::_returnFluxes(threadId, o1, o2, o3, n_cells, + mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, dev_flux, densityStarFluxR, momentumStarFluxXR, momentumStarFluxYR, momentumStarFluxZR, @@ -445,8 +446,8 @@ Real velocityDoubleStarY, velocityDoubleStarZ, magneticDoubleStarY, magneticDoubleStarZ, energyDoubleStarL, energyDoubleStarR; - _hlldInternal::_doubleStarState(speedM, - magneticXL, + mhd::_internal::_doubleStarState(speedM, + magneticX, totalPressureStar, densityStarL, velocityStarYL, @@ -473,7 +474,7 @@ Real momentumDoubleStarFluxX, momentumDoubleStarFluxY, momentumDoubleStarFluxZ, energyDoubleStarFlux, magneticDoubleStarFluxY, magneticDoubleStarFluxZ; - _hlldInternal::_doubleStarFluxes(speedStarL, + mhd::_internal::_doubleStarFluxes(speedStarL, momentumStarFluxXL, momentumStarFluxYL, momentumStarFluxZL, @@ -500,7 +501,7 @@ magneticDoubleStarFluxY, magneticDoubleStarFluxZ); - _hlldInternal::_returnFluxes(threadId, o1, o2, o3, n_cells, + mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, dev_flux, densityStarFluxL, momentumDoubleStarFluxX, momentumDoubleStarFluxY, momentumDoubleStarFluxZ, 
@@ -525,7 +526,7 @@ Real momentumDoubleStarFluxX, momentumDoubleStarFluxY, momentumDoubleStarFluxZ, energyDoubleStarFlux, magneticDoubleStarFluxY, magneticDoubleStarFluxZ; - _hlldInternal::_doubleStarFluxes(speedStarR, + mhd::_internal::_doubleStarFluxes(speedStarR, momentumStarFluxXR, momentumStarFluxYR, momentumStarFluxZR, @@ -552,7 +553,7 @@ magneticDoubleStarFluxY, magneticDoubleStarFluxZ); - _hlldInternal::_returnFluxes(threadId, o1, o2, o3, n_cells, + mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, dev_flux, densityStarFluxR, momentumDoubleStarFluxX, momentumDoubleStarFluxY, momentumDoubleStarFluxZ, @@ -575,7 +576,7 @@ }; // ========================================================================= - namespace _hlldInternal + namespace _internal { // ===================================================================== __device__ __host__ void _approximateWaveSpeeds(Real const &densityL, @@ -587,7 +588,7 @@ Real const &velocityZL, Real const &gasPressureL, Real const &totalPressureL, - Real const &magneticXL, + Real const &magneticX, Real const &magneticYL, Real const &magneticZL, Real const &densityR, @@ -599,7 +600,6 @@ Real const &velocityZR, Real const &gasPressureR, Real const &totalPressureR, - Real const &magneticXR, Real const &magneticYR, Real const &magneticZR, Real const &gamma, @@ -612,15 +612,15 @@ Real &densityStarR) { // Get the fast magnetosonic wave speeds - Real magSonicL = mhdUtils::fastMagnetosonicSpeed(densityL, + Real magSonicL = mhd::utils::fastMagnetosonicSpeed(densityL, gasPressureL, - magneticXL, + magneticX, magneticYL, magneticZL, gamma); - Real magSonicR = mhdUtils::fastMagnetosonicSpeed(densityR, + Real magSonicR = mhd::utils::fastMagnetosonicSpeed(densityR, gasPressureR, - magneticXR, + magneticX, magneticYR, magneticZR, gamma); @@ -646,8 +646,8 @@ densityStarR = densityR * (speedR - velocityXR) / (speedR - speedM); // Compute the S_L^* and S_R^* wave speeds - speedStarL = speedM - mhdUtils::alfvenSpeed(magneticXL, 
densityStarL); - speedStarR = speedM + mhdUtils::alfvenSpeed(magneticXR, densityStarR); + speedStarL = speedM - mhd::utils::alfvenSpeed(magneticX, densityStarL); + speedStarR = speedM + mhd::utils::alfvenSpeed(magneticX, densityStarR); } // ===================================================================== @@ -701,13 +701,13 @@ Real const &magneticFluxY, Real const &magneticFluxZ) { - dev_flux[threadId] = densityFlux; - dev_flux[threadId + n_cells * o1] = momentumFluxX; - dev_flux[threadId + n_cells * o2] = momentumFluxY; - dev_flux[threadId + n_cells * o3] = momentumFluxZ; - dev_flux[threadId + n_cells * 4] = energyFlux; - dev_flux[threadId + n_cells * (o2 + 4 + NSCALARS)] = magneticFluxY; - dev_flux[threadId + n_cells * (o3 + 4 + NSCALARS)] = magneticFluxZ; + dev_flux[threadId] = densityFlux; + dev_flux[threadId + n_cells * o1] = momentumFluxX; + dev_flux[threadId + n_cells * o2] = momentumFluxY; + dev_flux[threadId + n_cells * o3] = momentumFluxZ; + dev_flux[threadId + n_cells * 4] = energyFlux; + dev_flux[threadId + n_cells * (5 + NSCALARS)] = magneticFluxY; + dev_flux[threadId + n_cells * (6 + NSCALARS)] = magneticFluxZ; } // ===================================================================== @@ -752,7 +752,7 @@ if (fabs(density * (speedSide - velocityX) * (speedSide - speedM) - (magneticX * magneticX)) - < totalPressureStar * _hlldInternal::_hlldSmallNumber) + < totalPressureStar * mhd::_internal::_hlldSmallNumber) { velocityStarY = velocityY; velocityStarZ = velocityZ; @@ -780,8 +780,8 @@ energyStar = ( energy * (speedSide - velocityX) - totalPressure * velocityX + totalPressureStar * speedM - + magneticX * (_hlldInternal::_dotProduct(velocityX, velocityY, velocityZ, magneticX, magneticY, magneticZ) - - _hlldInternal::_dotProduct(speedM, velocityStarY, velocityStarZ, magneticX, magneticStarY, magneticStarZ))) + + magneticX * (math_utils::dotProduct(velocityX, velocityY, velocityZ, magneticX, magneticY, magneticZ) + - math_utils::dotProduct(speedM, 
velocityStarY, velocityStarZ, magneticX, magneticStarY, magneticStarZ))) / (speedSide - speedM); // Now compute the star state fluxes @@ -819,7 +819,7 @@ Real &energyDoubleStarR) { // if Bx is zero then just return the star state - if (magneticX < _hlldInternal::_hlldSmallNumber * totalPressureStar) + if (magneticX < mhd::_internal::_hlldSmallNumber * totalPressureStar) { velocityDoubleStarY = velocityStarYL; velocityDoubleStarZ = velocityStarZL; @@ -856,17 +856,17 @@ + magXSign * (sqrtDL * sqrtDR) * (velocityStarZR - velocityStarZL)); // Double star energy - Real velDblStarDotMagDblStar = _hlldInternal::_dotProduct(speedM, + Real velDblStarDotMagDblStar = math_utils::dotProduct(speedM, velocityDoubleStarY, velocityDoubleStarZ, magneticX, magneticDoubleStarY, magneticDoubleStarZ); energyDoubleStarL = energyStarL - sqrtDL * magXSign - * (_hlldInternal::_dotProduct(speedM, velocityStarYL, velocityStarZL, magneticX, magneticStarYL, magneticStarZL) + * (math_utils::dotProduct(speedM, velocityStarYL, velocityStarZL, magneticX, magneticStarYL, magneticStarZL) - velDblStarDotMagDblStar); energyDoubleStarR = energyStarR + sqrtDR * magXSign - * (_hlldInternal::_dotProduct(speedM, velocityStarYR, velocityStarZR, magneticX, magneticStarYR, magneticStarZR) + * (math_utils::dotProduct(speedM, velocityStarYR, velocityStarZR, magneticX, magneticStarYR, magneticStarZR) - velDblStarDotMagDblStar); } } @@ -909,7 +909,7 @@ } // ===================================================================== - } // _hlldInternal namespace - + } // mhd::_internal namespace +} // end namespace mhd #endif // CUDA \ No newline at end of file diff --git a/src/riemann_solvers/hlld_cuda.h b/src/riemann_solvers/hlld_cuda.h index d8d58dce1..357c850d6 100644 --- a/src/riemann_solvers/hlld_cuda.h +++ b/src/riemann_solvers/hlld_cuda.h @@ -13,23 +13,32 @@ #include "../global/global.h" #ifdef CUDA - +/*! + * \brief Namespace for MHD code + * + */ +namespace mhd +{ /*! 
 * \brief Compute the HLLD fluxes from Miyoshi & Kusano 2005 * - * \param[in] dev_bounds_L - * \param[in] dev_bounds_R - * \param[out] dev_flux - * \param[in] nx - * \param[in] ny - * \param[in] nz - * \param[in] n_ghost - * \param[in] gamma - * \param[in] dir - * \param[in] n_fields + * \param[in] dev_bounds_L The interface states on the left side of the interface + * \param[in] dev_bounds_R The interface states on the right side of the interface + * \param[in] dev_magnetic_face A pointer to the beginning of the conserved + * magnetic field array that is stored at the interface. I.e. for the + * X-direction solve this would be the beginning of the X-direction fields + * \param[out] dev_flux The output flux + * \param[in] nx Number of cells in the X-direction + * \param[in] ny Number of cells in the Y-direction + * \param[in] nz Number of cells in the Z-direction + * \param[in] n_ghost Number of ghost cells on each side + * \param[in] gamma The adiabatic index + * \param[in] dir The direction that the solve is taking place in. 0=X, 1=Y, 2=Z + * \param[in] n_fields The total number of fields */ __global__ void Calculate_HLLD_Fluxes_CUDA(Real *dev_bounds_L, Real *dev_bounds_R, + Real *dev_magnetic_face, Real *dev_flux, int nx, int ny, @@ -44,7 +53,7 @@ * solver * */ - namespace _hlldInternal + namespace _internal { /*! * \brief Used for some comparisons. 
Value was chosen to match what is @@ -65,7 +74,7 @@ * \param[in] velocityZL Velocity in the Z-direction, left side * \param[in] gasPressureL Gas pressure, left side * \param[in] totalPressureL Total MHD pressure, left side - * \param[in] magneticXL Magnetic field in the X-direction, left side + * \param[in] magneticX Magnetic field in the X-direction, left side * \param[in] magneticYL Magnetic field in the Y-direction, left side * \param[in] magneticZL Magnetic field in the Z-direction, left side * \param[in] densityR Density, right side @@ -77,7 +86,6 @@ * \param[in] velocityZR Velocity in the Z-direction, right side * \param[in] gasPressureR Gas pressure, right side * \param[in] totalPressureR Total MHD pressure, right side - * \param[in] magneticXR Magnetic field in the X-direction, right side * \param[in] magneticYR Magnetic field in the Y-direction, right side * \param[in] magneticZR Magnetic field in the Z-direction, right side * \param[in] gamma Adiabatic index @@ -98,7 +106,7 @@ Real const &velocityZL, Real const &gasPressureL, Real const &totalPressureL, - Real const &magneticXL, + Real const &magneticX, Real const &magneticYL, Real const &magneticZL, Real const &densityR, @@ -110,7 +118,6 @@ Real const &velocityZR, Real const &gasPressureR, Real const &totalPressureR, - Real const &magneticXR, Real const &magneticYR, Real const &magneticZR, Real const &gamma, @@ -266,26 +273,6 @@ Real &magneticStarFluxY, Real &magneticStarFluxZ); - /*! - * \brief Compute the dot product of a and b. 
- * - * \param[in] a1 The first element of a - * \param[in] a2 The second element of a - * \param[in] a3 The third element of a - * \param[in] b1 The first element of b - * \param[in] b2 The second element of b - * \param[in] b3 The third element of b - * - * \return Real The dot product of a and b - */ - inline __device__ __host__ Real _dotProduct(Real const &a1, - Real const &a2, - Real const &a3, - Real const &b1, - Real const &b2, - Real const &b3) - {return a1*b1 + ((a2*b2) + (a3*b3));}; - /*! * \brief Compute the double star state * @@ -390,6 +377,6 @@ Real &magneticDoubleStarFluxY, Real &magneticDoubleStarFluxZ); - } // _hlldInternal namespace - + } // end namespace mhd::_internal +} // end namespace mhd #endif //CUDA diff --git a/src/riemann_solvers/hlld_cuda_tests.cu b/src/riemann_solvers/hlld_cuda_tests.cu index 754c2dba0..c39116d7a 100644 --- a/src/riemann_solvers/hlld_cuda_tests.cu +++ b/src/riemann_solvers/hlld_cuda_tests.cu @@ -21,7 +21,7 @@ #include "../utils/mhd_utilities.h" #include "../riemann_solvers/hlld_cuda.h" // Include code to test -#if defined(CUDA) && defined(HLLD) +#ifdef CUDA // ========================================================================= // Integration tests for the entire HLLD solver. 
Unit tests are below // ========================================================================= @@ -59,15 +59,23 @@ int const &direction=0) { - // Rearrange X, Y, and Z values if a different direction is chosen - // besides default - stateLeft = _cycleXYZ(stateLeft, direction); - stateRight = _cycleXYZ(stateRight, direction); + // Rearrange X, Y, and Z values for the chosen direction + std::rotate(stateLeft.begin() + 1, stateLeft.begin() + 4 - direction, stateLeft.begin() + 4); + std::rotate(stateRight.begin()+ 1, stateRight.begin()+ 4 - direction, stateRight.begin()+ 4); + + // Create new vectors that store the values in the way that the HLLD + // solver expects + size_t const magXIndex = 5+NSCALARS; + EXPECT_DOUBLE_EQ(stateLeft.at(magXIndex), stateRight.at(magXIndex)) + << "The left and right magnetic fields are not equal"; + std::vector const magneticX{stateLeft.at(magXIndex)}; + stateLeft.erase(stateLeft.begin() + magXIndex); + stateRight.erase(stateRight.begin() + magXIndex); // Simulation Paramters - int const nx = 1; // Number of cells in the x-direction? - int const ny = 1; // Number of cells in the y-direction? - int const nz = 1; // Number of cells in the z-direction? 
+ int const nx = 1; // Number of cells in the x-direction + int const ny = 1; // Number of cells in the y-direction + int const nz = 1; // Number of cells in the z-direction int const nGhost = 0; // Isn't actually used it appears int nFields = 8; // Total number of conserved fields #ifdef SCALAR @@ -83,33 +91,40 @@ // Create the std::vector to store the fluxes and declare the device // pointers - std::vector testFlux(nFields); + std::vector testFlux(nFields-1, 0); Real *devConservedLeft; Real *devConservedRight; + Real *devConservedMagXFace; Real *devTestFlux; // Allocate device arrays and copy data - CudaSafeCall(cudaMalloc(&devConservedLeft, nFields*sizeof(Real))); - CudaSafeCall(cudaMalloc(&devConservedRight, nFields*sizeof(Real))); - CudaSafeCall(cudaMalloc(&devTestFlux, nFields*sizeof(Real))); + CudaSafeCall(cudaMalloc(&devConservedLeft, stateLeft.size()*sizeof(Real))); + CudaSafeCall(cudaMalloc(&devConservedRight, stateRight.size()*sizeof(Real))); + CudaSafeCall(cudaMalloc(&devConservedMagXFace, magneticX.size()*sizeof(Real))); + CudaSafeCall(cudaMalloc(&devTestFlux, testFlux.size()*sizeof(Real))); CudaSafeCall(cudaMemcpy(devConservedLeft, stateLeft.data(), - nFields*sizeof(Real), + stateLeft.size()*sizeof(Real), cudaMemcpyHostToDevice)); CudaSafeCall(cudaMemcpy(devConservedRight, stateRight.data(), - nFields*sizeof(Real), + stateRight.size()*sizeof(Real), + cudaMemcpyHostToDevice)); + CudaSafeCall(cudaMemcpy(devConservedMagXFace, + magneticX.data(), + magneticX.size()*sizeof(Real), cudaMemcpyHostToDevice)); // Run kernel - hipLaunchKernelGGL(Calculate_HLLD_Fluxes_CUDA, + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dimGrid, dimBlock, 0, 0, devConservedLeft, // the "left" interface devConservedRight, // the "right" interface + devConservedMagXFace, // the magnetic field at the interface devTestFlux, nx, ny, @@ -122,13 +137,25 @@ CudaCheckError(); CudaSafeCall(cudaMemcpy(testFlux.data(), devTestFlux, - nFields*sizeof(Real), + 
testFlux.size()*sizeof(Real), cudaMemcpyDeviceToHost)); // Make sure to sync with the device so we have the results cudaDeviceSynchronize(); CudaCheckError(); + // Free device arrays + cudaFree(devConservedLeft); + cudaFree(devConservedRight); + cudaFree(devConservedMagXFace); + cudaFree(devTestFlux); + + // The HLLD solver only writes to the first two "slots" for + magnetic flux so let's rearrange to make sure we have all the + magnetic fluxes in the right spots + testFlux.insert(testFlux.begin() + magXIndex, 0.0); + std::rotate(testFlux.begin() + 1, testFlux.begin() + 1 + direction, testFlux.begin() + 4); // Rotate momentum + return testFlux; } // ===================================================================== @@ -185,10 +212,6 @@ scalarFlux.begin() + NSCALARS); #endif //SCALAR - // Rearrange X, Y, and Z values if a different direction is chosen - // besides default - fiducialFlux = _cycleXYZ(fiducialFlux, direction); - ASSERT_TRUE( (fiducialFlux.size() == testFlux.size()) and (fiducialFlux.size() == fieldNames.size())) << "The fiducial flux, test flux, and field name vectors are not all the same length" << std::endl @@ -242,7 +265,7 @@ output.at(1) = input.at(1) * input.at(0); // X Velocity to momentum output.at(2) = input.at(2) * input.at(0); // Y Velocity to momentum output.at(3) = input.at(3) * input.at(0); // Z Velocity to momentum - output.at(4) = mhdUtils::computeEnergy(input.at(4), + output.at(4) = mhd::utils::computeEnergy(input.at(4), input.at(0), input.at(1), input.at(2), @@ -266,7 +289,7 @@ conservedScalar.begin() + NSCALARS); #endif //SCALAR #ifdef DE - output.push_back(mhdUtils::computeThermalEnergy(output.at(4), + output.push_back(mhd::utils::computeThermalEnergy(output.at(4), output.at(0), output.at(1), output.at(2), @@ -294,52 +317,6 @@ } // ===================================================================== private: - // ===================================================================== - /*! 
- * \brief Cyclically permute the vector quantities in the list of - * conserved variables so that the same interfaces and fluxes can be - * used to test the HLLD solver in all 3 directions. - * - * \param[in,out] conservedVec The std::vector of conserved variables to - * be cyclically permutated - * \param[in] direction Which plane the interface is. 0 = plane normal - * to X, 1 = plane normal to Y, 2 = plane normal to Z - * - * \return std::vector The cyclically permutated list of conserved - * variables - */ - std::vector inline _cycleXYZ(std::vector conservedVec, - int const &direction) - { - switch (direction) - { - case 0: // Plane normal to X. Default case, do nothing - ; - break; - case 1: // Plane normal to Y - case 2: // Plane normal to Z - // Fall through for both Y and Z normal planes - { - size_t shift = 3 - direction; - auto momentumBegin = conservedVec.begin()+1; - auto magneticBegin = conservedVec.begin()+5; - #ifdef SCALAR - magneticBegin += NSCALARS; - #endif //SCALAR - - std::rotate(momentumBegin, momentumBegin+shift, momentumBegin+3); - std::rotate(magneticBegin, magneticBegin+shift, magneticBegin+3); - } - break; - default: - throw std::invalid_argument(("Invalid Value of `direction`" - " passed to `_cycleXYZ`. Value passed was " - + std::to_string(direction) + ", should be 0, 1, or 2.")); - break; - } - return conservedVec; - } - // ===================================================================== }; // ========================================================================= @@ -1525,6 +1502,61 @@ } // ========================================================================= + // ========================================================================= + /*! 
+ * \brief Test the HLLD Riemann Solver using the constant states from the + * examples in cholla/examples/3D + * + */ + TEST_F(tMHDCalculateHLLDFluxesCUDA, + ConstantStatesExpectCorrectFlux) + { + // Constant Values + Real const gamma = 5./3.; + + std::vector const primitiveScalar{1.1069975296, 2.2286185018, 3.3155141875}; + + // States + std::vector const // | Density | X-Velocity | Y-Velocity | Z-Velocity | Pressure | X-Magnetic Field | Y-Magnetic Field | Z-Magnetic Field | Adiabatic Index | Passive Scalars | + zeroMagneticField = primitive2Conserved({1e4, 0.0, 0.0, 0.0, 1.380658E-5, 0.0, 0.0, 0.0}, gamma, primitiveScalar), + onesMagneticField = primitive2Conserved({1e4, 0.0, 0.0, 0.0, 1.380658E-5, 1.0, 1.0, 1.0}, gamma, primitiveScalar); + + for (size_t direction = 2; direction < 3; direction++) + { + { + std::string const outputString {"Left State: Constant state, zero magnetic field\n" + "Right State: Constant state, zero magnetic field\n" + "HLLD State: Left Star"}; + // Compute the fluxes and check for correctness + // Order of Fluxes is rho, vec(V), E, vec(B) + std::vector const fiducialFlux{0,1.380658e-05,0,0,0,0,0,0}; + std::vector const scalarFlux{0,0,0}; + Real thermalEnergyFlux = 0.; + std::vector const testFluxes = computeFluxes(zeroMagneticField, + zeroMagneticField, + gamma, + direction); + checkResults(fiducialFlux, scalarFlux, thermalEnergyFlux, testFluxes, outputString, direction); + } + { + std::string const outputString {"Left State: Constant state, ones magnetic field\n" + "Right State: Constant state, ones magnetic field\n" + "HLLD State: Left Double Star"}; + // Compute the fluxes and check for correctness + // Order of Fluxes is rho, vec(V), E, vec(B) + std::vector const fiducialFlux{0, 0.50001380657999994, -1, -1, -1.7347234759768071e-18, 0.0, 3.4694469519536142e-18, 3.4694469519536142e-18}; + std::vector const scalarFlux{1.5731381063233131e-14, 3.1670573744690958e-14, 4.7116290424753513e-14}; + Real thermalEnergyFlux = 0.; + std::vector 
const testFluxes = computeFluxes(onesMagneticField, + onesMagneticField, + gamma, + direction); + checkResults(fiducialFlux, scalarFlux, thermalEnergyFlux, testFluxes, outputString, direction); + } + } + } + // ========================================================================= + // ========================================================================= /*! * \brief Test the HLLD Riemann Solver with the degenerate state @@ -1633,11 +1665,11 @@ negativeDensityPressure.insert(negativeDensityPressure.begin()+5, conservedScalar.begin(), conservedScalar.begin() + NSCALARS); #endif // SCALAR #ifdef DE - negativePressure.push_back(mhdUtils::computeThermalEnergy(negativePressure.at(4),negativePressure.at(0),negativePressure.at(1),negativePressure.at(2),negativePressure.at(3),negativePressure.at(5 + NSCALARS),negativePressure.at(6 + NSCALARS),negativePressure.at(7 + NSCALARS),gamma)); - negativeEnergy.push_back(mhdUtils::computeThermalEnergy(negativeEnergy.at(4),negativeEnergy.at(0),negativeEnergy.at(1),negativeEnergy.at(2),negativeEnergy.at(3),negativeEnergy.at(5 + NSCALARS),negativeEnergy.at(6 + NSCALARS),negativeEnergy.at(7 + NSCALARS),gamma)); - negativeDensity.push_back(mhdUtils::computeThermalEnergy(negativeDensity.at(4),negativeDensity.at(0),negativeDensity.at(1),negativeDensity.at(2),negativeDensity.at(3),negativeDensity.at(5 + NSCALARS),negativeDensity.at(6 + NSCALARS),negativeDensity.at(7 + NSCALARS),gamma)); - negativeDensityEnergyPressure.push_back(mhdUtils::computeThermalEnergy(negativeDensityEnergyPressure.at(4),negativeDensityEnergyPressure.at(0),negativeDensityEnergyPressure.at(1),negativeDensityEnergyPressure.at(2),negativeDensityEnergyPressure.at(3),negativeDensityEnergyPressure.at(5 + NSCALARS),negativeDensityEnergyPressure.at(6 + NSCALARS),negativeDensityEnergyPressure.at(7 + NSCALARS),gamma)); - 
negativeDensityPressure.push_back(mhdUtils::computeThermalEnergy(negativeDensityPressure.at(4),negativeDensityPressure.at(0),negativeDensityPressure.at(1),negativeDensityPressure.at(2),negativeDensityPressure.at(3),negativeDensityPressure.at(5 + NSCALARS),negativeDensityPressure.at(6 + NSCALARS),negativeDensityPressure.at(7 + NSCALARS),gamma)); + negativePressure.push_back(mhd::utils::computeThermalEnergy(negativePressure.at(4),negativePressure.at(0),negativePressure.at(1),negativePressure.at(2),negativePressure.at(3),negativePressure.at(5 + NSCALARS),negativePressure.at(6 + NSCALARS),negativePressure.at(7 + NSCALARS),gamma)); + negativeEnergy.push_back(mhd::utils::computeThermalEnergy(negativeEnergy.at(4),negativeEnergy.at(0),negativeEnergy.at(1),negativeEnergy.at(2),negativeEnergy.at(3),negativeEnergy.at(5 + NSCALARS),negativeEnergy.at(6 + NSCALARS),negativeEnergy.at(7 + NSCALARS),gamma)); + negativeDensity.push_back(mhd::utils::computeThermalEnergy(negativeDensity.at(4),negativeDensity.at(0),negativeDensity.at(1),negativeDensity.at(2),negativeDensity.at(3),negativeDensity.at(5 + NSCALARS),negativeDensity.at(6 + NSCALARS),negativeDensity.at(7 + NSCALARS),gamma)); + negativeDensityEnergyPressure.push_back(mhd::utils::computeThermalEnergy(negativeDensityEnergyPressure.at(4),negativeDensityEnergyPressure.at(0),negativeDensityEnergyPressure.at(1),negativeDensityEnergyPressure.at(2),negativeDensityEnergyPressure.at(3),negativeDensityEnergyPressure.at(5 + NSCALARS),negativeDensityEnergyPressure.at(6 + NSCALARS),negativeDensityEnergyPressure.at(7 + NSCALARS),gamma)); + negativeDensityPressure.push_back(mhd::utils::computeThermalEnergy(negativeDensityPressure.at(4),negativeDensityPressure.at(0),negativeDensityPressure.at(1),negativeDensityPressure.at(2),negativeDensityPressure.at(3),negativeDensityPressure.at(5 + NSCALARS),negativeDensityPressure.at(6 + NSCALARS),negativeDensityPressure.at(7 + NSCALARS),gamma)); #endif //DE for (size_t direction = 0; direction < 3; 
direction++) @@ -1726,7 +1758,7 @@ // ========================================================================= // ========================================================================= - // Unit tests for the contents of the _hlldInternal namespace + // Unit tests for the contents of the mhd::_internal namespace // ========================================================================= /*! * \brief A struct to hold some basic test values @@ -1827,10 +1859,10 @@ { for (size_t i = 0; i < names.size(); i++) { - gasPressureL.push_back(mhdUtils::computeGasPressure(energyL[i], densityL[i], momentumXL[i], momentumYL[i], momentumZL[i], magneticXL[i], magneticYL[i], magneticZL[i], gamma)); - gasPressureR.push_back(mhdUtils::computeGasPressure(energyR[i], densityR[i], momentumXR[i], momentumYR[i], momentumZR[i], magneticXR[i], magneticYR[i], magneticZR[i], gamma)); - totalPressureL.push_back(mhdUtils::computeTotalPressure(gasPressureL.back(), magneticXL[i], magneticYL[i], magneticZL[i])); - totalPressureR.push_back(mhdUtils::computeTotalPressure(gasPressureL.back(), magneticXR[i], magneticYR[i], magneticZR[i])); + gasPressureL.push_back(mhd::utils::computeGasPressure(energyL[i], densityL[i], momentumXL[i], momentumYL[i], momentumZL[i], magneticXL[i], magneticYL[i], magneticZL[i], gamma)); + gasPressureR.push_back(mhd::utils::computeGasPressure(energyR[i], densityR[i], momentumXR[i], momentumYR[i], momentumZR[i], magneticXR[i], magneticYR[i], magneticZR[i], gamma)); + totalPressureL.push_back(mhd::utils::computeTotalPressure(gasPressureL.back(), magneticXL[i], magneticYL[i], magneticZL[i])); + totalPressureR.push_back(mhd::utils::computeTotalPressure(gasPressureL.back(), magneticXR[i], magneticYR[i], magneticZR[i])); } } }; @@ -1839,7 +1871,7 @@ // ========================================================================= /*! 
- * \brief Test the _hlldInternal::_approximateWaveSpeeds function + * \brief Test the mhd::_internal::_approximateWaveSpeeds function * */ TEST(tMHDHlldInternalApproximateWaveSpeeds, @@ -1850,7 +1882,7 @@ std::vector const fiducialSpeedR {24.295526347371595, 12.519790189404299}; std::vector const fiducialSpeedM {-0.81760587897407833, -0.026643804611559244}; std::vector const fiducialSpeedStarL {-19.710500632936679, -4.4880642018724357}; - std::vector const fiducialSpeedStarR {9.777062240423124, 9.17474383484066}; + std::vector const fiducialSpeedStarR {9.6740190040662242, 3.4191202933087519}; std::vector const fiducialDensityStarL{24.101290139122913, 50.132466596958501}; std::vector const fiducialDensityStarR{78.154104734671265, 84.041595114910123}; @@ -1864,7 +1896,7 @@ for (size_t i = 0; i < parameters.names.size(); i++) { - _hlldInternal::_approximateWaveSpeeds(parameters.densityL[i], + mhd::_internal::_approximateWaveSpeeds(parameters.densityL[i], parameters.momentumXL[i], parameters.momentumYL[i], parameters.momentumZL[i], @@ -1885,7 +1917,6 @@ parameters.velocityZR[i], parameters.gasPressureR[i], parameters.totalPressureR[i], - parameters.magneticXR[i], parameters.magneticYR[i], parameters.magneticZR[i], parameters.gamma, @@ -1924,7 +1955,7 @@ // ========================================================================= /*! - * \brief Test the _hlldInternal::_starFluxes function in the non-degenerate + * \brief Test the mhd::_internal::_starFluxes function in the non-degenerate * case * */ @@ -1961,7 +1992,7 @@ for (size_t i = 0; i < parameters.names.size(); i++) { - _hlldInternal::_starFluxes(parameters.speedM[i], + mhd::_internal::_starFluxes(parameters.speedM[i], parameters.speedSide[i], parameters.densityL[i], parameters.velocityXL[i], @@ -2038,7 +2069,7 @@ } /*! 
- * \brief Test the _hlldInternal::_starFluxes function in the degenerate + * \brief Test the mhd::_internal::_starFluxes function in the degenerate * case * */ @@ -2078,7 +2109,7 @@ for (size_t i = 0; i < parameters.names.size(); i++) { - _hlldInternal::_starFluxes(parameters.speedM[i], + mhd::_internal::_starFluxes(parameters.speedM[i], parameters.speedSide[i], parameters.densityL[i], parameters.velocityXL[i], @@ -2157,7 +2188,7 @@ // ========================================================================= /*! - * \brief Test the _hlldInternal::_nonStarFluxes function + * \brief Test the mhd::_internal::_nonStarFluxes function * */ TEST(tMHDHlldInternalNonStarFluxes, @@ -2183,7 +2214,7 @@ for (size_t i = 0; i < parameters.names.size(); i++) { - _hlldInternal::_nonStarFluxes(parameters.momentumXL[i], + mhd::_internal::_nonStarFluxes(parameters.momentumXL[i], parameters.velocityXL[i], parameters.velocityYL[i], parameters.velocityZL[i], @@ -2228,38 +2259,7 @@ // ========================================================================= /*! - * \brief Test the _hlldInternal::_dotProduct function - * - */ - TEST(tMHDHlldInternalDotProduct, - CorrectInputExpectCorrectOutput) - { - testParams const parameters; - - std::vector const fiducialDotProduct{5149.7597411033557,6127.2319832451567}; - - double testDotProduct; - - for (size_t i = 0; i < parameters.names.size(); i++) - { - testDotProduct = _hlldInternal::_dotProduct(parameters.momentumXL[i], - parameters.momentumYL[i], - parameters.momentumZL[i], - parameters.magneticXL[i], - parameters.magneticYL[i], - parameters.magneticZL[i]); - - // Now check results - testingUtilities::checkResults(fiducialDotProduct[i], - testDotProduct, - parameters.names.at(i) + ", DotProduct"); - } - } - // ========================================================================= - - // ========================================================================= - /*! - * \brief Test the _hlldInternal::_doubleStarState function. 
Non-degenerate + * \brief Test the mhd::_internal::_doubleStarState function. Non-degenerate * state * */ @@ -2286,7 +2286,7 @@ for (size_t i = 0; i < parameters.names.size(); i++) { - _hlldInternal::_doubleStarState(parameters.speedM[i], + mhd::_internal::_doubleStarState(parameters.speedM[i], parameters.magneticXL[i], parameters.totalPressureStarL[i], parameters.densityStarL[i], @@ -2332,7 +2332,7 @@ } /*! - * \brief Test the _hlldInternal::_doubleStarState function in the + * \brief Test the mhd::_internal::_doubleStarState function in the * degenerate state. * */ @@ -2357,7 +2357,7 @@ for (size_t i = 0; i < parameters.names.size(); i++) { - _hlldInternal::_doubleStarState(parameters.speedM[i], + mhd::_internal::_doubleStarState(parameters.speedM[i], 0.0, parameters.totalPressureStarL[i], parameters.densityStarL[i], @@ -2403,7 +2403,7 @@ // ========================================================================= /*! - * \brief Test the _hlldInternal::_doubleStarFluxes function + * \brief Test the mhd::_internal::_doubleStarFluxes function * */ TEST(tMHDHlldInternalDoubleStarFluxes, @@ -2428,7 +2428,7 @@ for (size_t i = 0; i < parameters.names.size(); i++) { - _hlldInternal::_doubleStarFluxes(parameters.speedSide[i], + mhd::_internal::_doubleStarFluxes(parameters.speedSide[i], parameters.momentumStarFluxX[i], parameters.momentumStarFluxY[i], parameters.momentumStarFluxZ[i], @@ -2480,7 +2480,7 @@ // ========================================================================= /*! 
- * \brief Test the _hlldInternal::_returnFluxes function + * \brief Test the mhd::_internal::_returnFluxes function * */ TEST(tMHDHlldInternalReturnFluxes, @@ -2532,10 +2532,10 @@ int const fiducialMomentumIndexY = threadId + n_cells * o2; int const fiducialMomentumIndexZ = threadId + n_cells * o3; int const fiducialEnergyIndex = threadId + n_cells * 4; - int const fiducialMagneticYIndex = threadId + n_cells * (o2 + 4 + NSCALARS); - int const fiducialMagneticZIndex = threadId + n_cells * (o3 + 4 + NSCALARS); + int const fiducialMagneticYIndex = threadId + n_cells * (5 + NSCALARS); + int const fiducialMagneticZIndex = threadId + n_cells * (6 + NSCALARS); - _hlldInternal::_returnFluxes(threadId, + mhd::_internal::_returnFluxes(threadId, o1, o2, o3, @@ -2578,4 +2578,4 @@ } } // ========================================================================= -#endif // CUDA & HLLD \ No newline at end of file +#endif // CUDA \ No newline at end of file diff --git a/src/system_tests/hydro_system_tests.cpp b/src/system_tests/hydro_system_tests.cpp index 72a6dc349..5ed2b050c 100644 --- a/src/system_tests/hydro_system_tests.cpp +++ b/src/system_tests/hydro_system_tests.cpp @@ -13,19 +13,17 @@ // Local includes #include "../system_tests/system_tester.h" #include "../utils/testing_utilities.h" - - +#include "../io/io.h" #ifndef PI #define PI 3.141592653589793 #endif - // ============================================================================= -// Test Suite: tHYDROSYSTEMSodShockTube +// Test Suite: tHYDROtMHDSYSTEMSodShockTube // ============================================================================= /*! 
- * \defgroup tHYDROSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput + * \defgroup tHYDROtMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput * \brief Test the Sod Shock tube initial conditions as a parameterized test * with varying numbers of MPI ranks * @@ -42,6 +40,28 @@ class tHYDROSYSTEMSodShockTubeParameterizedMpi TEST_P(tHYDROSYSTEMSodShockTubeParameterizedMpi, CorrectInputExpectCorrectOutput) { + #ifdef MHD + // Loosen correctness check to account for MHD only having PCM. This is + // about the error between PCM and PPMP in hydro + sodTest.setFixedEpsilon(1E-3); + + // Don't test the gas energy fields + auto datasetNames = sodTest.getDataSetsToTest(); + datasetNames.erase(std::remove(datasetNames.begin(), datasetNames.end(), "GasEnergy"), datasetNames.end()); + + // Set the magnetic fiducial datasets to zero + size_t const size = std::pow(65, 3); + std::vector const magVec(0, size); + + for (auto field: {"magnetic_x","magnetic_y","magnetic_z"}) + { + sodTest.setFiducialData(field, magVec); + datasetNames.push_back(field); + } + + sodTest.setDataSetsToTest(datasetNames); + #endif //MHD + sodTest.numMpiRanks = GetParam(); sodTest.runTest(); } @@ -52,7 +72,7 @@ INSTANTIATE_TEST_SUITE_P(CorrectInputExpectCorrectOutput, /// @} // ============================================================================= -TEST(tHYDROSYSTEMConstant, +TEST(tHYDROtMHDSYSTEMConstant, CorrectInputExpectCorrectOutput) { systemTest::SystemTestRunner testObject(false, false, false); @@ -70,15 +90,15 @@ TEST(tHYDROSYSTEMConstant, } -TEST(tHYDROSYSTEMSoundWave3D, +TEST(tHYDROtMHDSYSTEMSoundWave3D, CorrectInputExpectCorrectOutput) { double time = 0.05; double amplitude = 1e-5; double dx = 1./64.; - + double real_kx = 2*PI;//kx of the physical problem - + double kx = real_kx * dx; double speed = 1;//speed of wave is 1 since P = 0.6 and gamma = 1.666667 double phase = kx*0.5 - speed * time * real_kx; //kx*0.5 for half-cell offset @@ -86,12 +106,191 @@ 
TEST(tHYDROSYSTEMSoundWave3D, systemTest::SystemTestRunner testObject(false, false, false); + #ifdef MHD + // Loosen correctness check to account for MHD only having PCM. This is + // about the error between PCM and PPMP in hydro + tolerance = 1E-6; + #endif //MHD + testObject.launchCholla(); testObject.openHydroTestData(); - testingUtilities::analyticSine(testObject,"density",1.0,amplitude,kx,0.0,0.0,phase,tolerance); - testingUtilities::analyticSine(testObject,"momentum_x",0.0,amplitude,kx,0.0,0.0,phase,tolerance); + ASSERT_NO_FATAL_FAILURE(testingUtilities::analyticSine(testObject,"density",1.0,amplitude,kx,0.0,0.0,phase,tolerance)); + ASSERT_NO_FATAL_FAILURE(testingUtilities::analyticSine(testObject,"momentum_x",0.0,amplitude,kx,0.0,0.0,phase,tolerance)); //testingUtilities::analyticSine(testObject,"momentum_y",0.0,amplitude,kx,0.0,0.0,0.0,tolerance); //testingUtilities::analyticSine(testObject,"momentum_z",0.0,amplitude,kx,0.0,0.0,0.0,tolerance); } + +// ============================================================================= +// Test Suite: tHYDROtMHDSYSTEMLinearWavesParameterizedMpi +// ============================================================================= +/*! + * \defgroup tHYDROtMHDSYSTEMLinearWavesParameterizedMpi + * \brief Test the linear waves initial conditions as a parameterized test + * with varying numbers of MPI ranks. 
+ * + */ +/// @{ +class tHYDROtMHDSYSTEMLinearWavesParameterizedMpi + :public + ::testing::TestWithParam +{ +public: + tHYDROtMHDSYSTEMLinearWavesParameterizedMpi() + : waveTest(false, true, false, false) + {}; +protected: + systemTest::SystemTestRunner waveTest; + + #ifdef PCM + double const allowedL1Error = 4E-7; // Based on results in Gardiner & Stone 2008 + double const allowedError = 4E-7; + #else //PCM + double const allowedL1Error = 1E-7; // Based on results in Gardiner & Stone 2008 + double const allowedError = 1E-7; + #endif //PCM + + void setLaunchParams(double const &waveSpeed, double const &rEigenVec_rho, + double const &rEigenVec_MomentumX, double const &rEigenVec_MomentumY, + double const &rEigenVec_MomentumZ, double const &rEigenVec_E, + double const &vx=0.0) + { + // Constant for all tests + size_t const N = 32; + double const domain = 0.5; + double const gamma = 5./3.; + double const tOut = 2*domain / waveSpeed; + + // Settings + waveTest.chollaLaunchParams.append(" nx=" + to_string_exact(2*N)); + waveTest.chollaLaunchParams.append(" ny=" + to_string_exact(N)); + waveTest.chollaLaunchParams.append(" nz=" + to_string_exact(N)); + waveTest.chollaLaunchParams.append(" tout=" + to_string_exact(tOut)); + waveTest.chollaLaunchParams.append(" outstep=" + to_string_exact(tOut)); + waveTest.chollaLaunchParams.append(" init=Linear_Wave"); + waveTest.chollaLaunchParams.append(" xmin=0.0"); + waveTest.chollaLaunchParams.append(" ymin=0.0"); + waveTest.chollaLaunchParams.append(" zmin=0.0"); + waveTest.chollaLaunchParams.append(" xlen=" + to_string_exact(2*domain)); + waveTest.chollaLaunchParams.append(" ylen=" + to_string_exact(domain)); + waveTest.chollaLaunchParams.append(" zlen=" + to_string_exact(domain)); + waveTest.chollaLaunchParams.append(" xl_bcnd=1"); + waveTest.chollaLaunchParams.append(" xu_bcnd=1"); + waveTest.chollaLaunchParams.append(" yl_bcnd=1"); + waveTest.chollaLaunchParams.append(" yu_bcnd=1"); + waveTest.chollaLaunchParams.append(" 
zl_bcnd=1"); + waveTest.chollaLaunchParams.append(" zu_bcnd=1"); + waveTest.chollaLaunchParams.append(" rho=1.0"); + waveTest.chollaLaunchParams.append(" vx=" + to_string_exact(vx)); + waveTest.chollaLaunchParams.append(" vy=0"); + waveTest.chollaLaunchParams.append(" vz=0"); + waveTest.chollaLaunchParams.append(" P=" + to_string_exact(1/gamma)); + waveTest.chollaLaunchParams.append(" Bx=0"); + waveTest.chollaLaunchParams.append(" By=0"); + waveTest.chollaLaunchParams.append(" Bz=0"); + waveTest.chollaLaunchParams.append(" A='1e-6'"); + waveTest.chollaLaunchParams.append(" gamma=" + to_string_exact(gamma)); + waveTest.chollaLaunchParams.append(" rEigenVec_rho=" + to_string_exact(rEigenVec_rho)); + waveTest.chollaLaunchParams.append(" rEigenVec_MomentumX=" + to_string_exact(rEigenVec_MomentumX)); + waveTest.chollaLaunchParams.append(" rEigenVec_MomentumY=" + to_string_exact(rEigenVec_MomentumY)); + waveTest.chollaLaunchParams.append(" rEigenVec_MomentumZ=" + to_string_exact(rEigenVec_MomentumZ)); + waveTest.chollaLaunchParams.append(" rEigenVec_E=" + to_string_exact(rEigenVec_E)); + waveTest.chollaLaunchParams.append(" rEigenVec_Bx=0"); + waveTest.chollaLaunchParams.append(" rEigenVec_By=0"); + waveTest.chollaLaunchParams.append(" rEigenVec_Bz=0"); + } +}; + +// Sound Waves Moving Left and Right +// ================================= +TEST_P(tHYDROtMHDSYSTEMLinearWavesParameterizedMpi, + SoundWaveRightMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 1.; + int const numTimeSteps = 214; + + double const rEigenVec_rho = 1; + double const rEigenVec_MomentumX = 1; + double const rEigenVec_MomentumY = 1; + double const rEigenVec_MomentumZ = 1; + double const rEigenVec_E = 1.5; + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E); + + // Set the number of MPI ranks + waveTest.numMpiRanks = GetParam(); + + // Set the number of 
timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps); + + // Check Results + waveTest.runL1ErrorTest(2*allowedL1Error, allowedError); +} + +TEST_P(tHYDROtMHDSYSTEMLinearWavesParameterizedMpi, + SoundWaveLeftMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 1.; + int const numTimeSteps = 214; + + double const rEigenVec_rho = 1; + double const rEigenVec_MomentumX = -1; + double const rEigenVec_MomentumY = 1; + double const rEigenVec_MomentumZ = 1; + double const rEigenVec_E = 1.5; + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E); + + // Set the number of MPI ranks + waveTest.numMpiRanks = GetParam(); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps); + + // Check Results + waveTest.runL1ErrorTest(2*allowedL1Error, allowedError); +} + +// Contact Waves Moving Left and Right +// =================================== +TEST_P(tHYDROtMHDSYSTEMLinearWavesParameterizedMpi, + HydroContactWaveCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 1.0; + int const numTimeSteps = 427; + + double const rEigenVec_rho = 1; + double const rEigenVec_MomentumX = 1; + double const rEigenVec_MomentumY = 0; + double const rEigenVec_MomentumZ = 0; + double const rEigenVec_E = 0.5; + double const velocityX = waveSpeed; + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + velocityX); + + // Set the number of MPI ranks + waveTest.numMpiRanks = GetParam(); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps); + + // Check Results + waveTest.runL1ErrorTest(allowedL1Error, allowedError); +} + +INSTANTIATE_TEST_SUITE_P(, + tHYDROtMHDSYSTEMLinearWavesParameterizedMpi, + ::testing::Values(1)); +/// @} +// 
============================================================================= \ No newline at end of file diff --git a/src/system_tests/input_files/blank_settings_file.txt b/src/system_tests/input_files/blank_settings_file.txt new file mode 100644 index 000000000..e8fbd7e77 --- /dev/null +++ b/src/system_tests/input_files/blank_settings_file.txt @@ -0,0 +1,3 @@ +# This is blank file for system tests that are setting all the parameters +# internally to point at. Without a blank file cholla will crash + diff --git a/src/system_tests/input_files/tHYDROSYSTEMConstant_CorrectInputExpectCorrectOutput.txt b/src/system_tests/input_files/tHYDROtMHDSYSTEMConstant_CorrectInputExpectCorrectOutput.txt similarity index 100% rename from src/system_tests/input_files/tHYDROSYSTEMConstant_CorrectInputExpectCorrectOutput.txt rename to src/system_tests/input_files/tHYDROtMHDSYSTEMConstant_CorrectInputExpectCorrectOutput.txt diff --git a/src/system_tests/input_files/tHYDROSYSTEMSoundWave3D_CorrectInputExpectCorrectOutput.txt b/src/system_tests/input_files/tHYDROtMHDSYSTEMSoundWave3D_CorrectInputExpectCorrectOutput.txt similarity index 70% rename from src/system_tests/input_files/tHYDROSYSTEMSoundWave3D_CorrectInputExpectCorrectOutput.txt rename to src/system_tests/input_files/tHYDROtMHDSYSTEMSoundWave3D_CorrectInputExpectCorrectOutput.txt index f1c23ea6e..efdedaceb 100644 --- a/src/system_tests/input_files/tHYDROSYSTEMSoundWave3D_CorrectInputExpectCorrectOutput.txt +++ b/src/system_tests/input_files/tHYDROtMHDSYSTEMSoundWave3D_CorrectInputExpectCorrectOutput.txt @@ -14,7 +14,7 @@ tout=0.05 # time interval for output outstep=0.05 # name of initial conditions -init=Sound_Wave +init=Linear_Wave # domain properties xmin=0.0 ymin=0.0 @@ -34,18 +34,31 @@ outdir=./ ################################################# # Parameters for linear wave problems -# initial density +# initial density rho=1.0 -# velocity in the x direction +# velocity in the x direction vx=0 # velocity in the y direction 
vy=0 # velocity in the z direction vz=0 -# initial pressure +# initial pressure P=0.6 # amplitude of perturbing oscillations A=1e-5 # value of gamma gamma=1.666666666666667 +# The right eigenvectors to set the wave properly +rEigenVec_rho=1 +rEigenVec_MomentumX=1 +rEigenVec_MomentumY=1 +rEigenVec_MomentumZ=1 +rEigenVec_E=1.5 +# Set the magnetic field quantities to zero +Bx=0 +By=0 +Bz=0 +rEigenVec_Bx=0 +rEigenVec_By=0 +rEigenVec_Bz=0 \ No newline at end of file diff --git a/src/system_tests/input_files/tMHDSYSTEMConstantParameterizedMpi_MagneticFieldCorrectInputExpectCorrectOutput.txt b/src/system_tests/input_files/tMHDSYSTEMConstantParameterizedMpi_MagneticFieldCorrectInputExpectCorrectOutput.txt new file mode 100644 index 000000000..eabea0e60 --- /dev/null +++ b/src/system_tests/input_files/tMHDSYSTEMConstantParameterizedMpi_MagneticFieldCorrectInputExpectCorrectOutput.txt @@ -0,0 +1,50 @@ +# +# Parameter File for 3D box filled with gas +# + +################################################ +# number of grid cells in the x dimension +nx=16 +# number of grid cells in the y dimension +ny=16 +# number of grid cells in the z dimension +nz=16 +# final output time +tout=100000.0 +# time interval for output +outstep=100000.0 +# name of initial conditions +init=Constant +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 +ylen=1.0 +zlen=1.0 +# type of boundary conditions +xl_bcnd=1 +xu_bcnd=1 +yl_bcnd=1 +yu_bcnd=1 +zl_bcnd=1 +zu_bcnd=1 +# path to output directory +outdir=./ + +################################################# +# density +rho=1e4 +# velocity +vx=0 +vy=0 +vz=0 +# pressure +P=1.380658e-5 +# Magnetic Field +Bx=1.0e-5 +By=2.0e-5 +Bz=3.0e-5 +# value of gamma +gamma=1.666666667 + diff --git a/src/system_tests/input_files/tMHDSYSTEMConstantParameterizedMpi_ZeroMagneticFieldCorrectInputExpectCorrectOutput.txt b/src/system_tests/input_files/tMHDSYSTEMConstantParameterizedMpi_ZeroMagneticFieldCorrectInputExpectCorrectOutput.txt new file mode 100644 index 
000000000..4f52b7cd6 --- /dev/null +++ b/src/system_tests/input_files/tMHDSYSTEMConstantParameterizedMpi_ZeroMagneticFieldCorrectInputExpectCorrectOutput.txt @@ -0,0 +1,50 @@ +# +# Parameter File for 3D box filled with gas +# + +################################################ +# number of grid cells in the x dimension +nx=16 +# number of grid cells in the y dimension +ny=16 +# number of grid cells in the z dimension +nz=16 +# final output time +tout=100000.0 +# time interval for output +outstep=100000.0 +# name of initial conditions +init=Constant +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 +ylen=1.0 +zlen=1.0 +# type of boundary conditions +xl_bcnd=1 +xu_bcnd=1 +yl_bcnd=1 +yu_bcnd=1 +zl_bcnd=1 +zu_bcnd=1 +# path to output directory +outdir=./ + +################################################# +# density +rho=1e4 +# velocity +vx=0 +vy=0 +vz=0 +# pressure +P=1.380658e-5 +# Magnetic Field +Bx=0.0 +By=0.0 +Bz=0.0 +# value of gamma +gamma=1.666666667 + diff --git a/src/system_tests/input_files/tMHDSYSTEMEinfeldtStrongRarefaction_CorrectInputExpectCorrectOutput.txt b/src/system_tests/input_files/tMHDSYSTEMEinfeldtStrongRarefaction_CorrectInputExpectCorrectOutput.txt new file mode 100644 index 000000000..3e4747551 --- /dev/null +++ b/src/system_tests/input_files/tMHDSYSTEMEinfeldtStrongRarefaction_CorrectInputExpectCorrectOutput.txt @@ -0,0 +1,71 @@ +# +# Parameter File for 3D Einfeldt Strong Rarefaction MHD test +# Citation: Einfeldt et al. 
1991 "On Godunov-Type Methods near Low Densities" +# + +################################################ +# number of grid cells in the x dimension +nx=32 +# number of grid cells in the y dimension +ny=32 +# number of grid cells in the z dimension +nz=32 +# final output time +tout=0.16 +# time interval for output +outstep=0.16 +# name of initial conditions +init=Riemann + +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 +ylen=1.0 +zlen=1.0 + +# type of boundary conditions +xl_bcnd=3 +xu_bcnd=3 +yl_bcnd=3 +yu_bcnd=3 +zl_bcnd=3 +zu_bcnd=3 + +# path to output directory +outdir=./ + +################################################# +# Parameters for 1D Riemann problems +# density of left state +rho_l=1.0 +# velocity of left state +vx_l=-2.0 +vy_l=0.0 +vz_l=0.0 +# pressure of left state +P_l=0.45 +# Magnetic field of the left state +Bx_l=0.0 +By_l=0.5 +Bz_l=0.0 + +# density of right state +rho_r=1.0 +# velocity of right state +vx_r=2.0 +vy_r=0.0 +vz_r=0.0 +# pressure of right state +P_r=0.45 +# Magnetic field of the right state +Bx_r=0.0 +By_r=0.5 +Bz_r=0.0 + +# location of initial discontinuity +diaph=0.5 +# value of gamma +gamma=1.4 + diff --git a/src/system_tests/input_files/tMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput.txt b/src/system_tests/input_files/tMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput.txt new file mode 100644 index 000000000..6fb66732b --- /dev/null +++ b/src/system_tests/input_files/tMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput.txt @@ -0,0 +1,57 @@ +# +# Parameter File for 1D Sod Shock tube +# + +################################################ +# number of grid cells in the x dimension +nx=64 +# number of grid cells in the y dimension +ny=64 +# number of grid cells in the z dimension +nz=64 +# final output time +tout=0.2 +# time interval for output +outstep=0.2 +# name of initial conditions +init=Riemann +# domain properties +xmin=0.0 +ymin=0.0 +zmin=0.0 +xlen=1.0 
+ylen=1.0 +zlen=1.0 +# type of boundary conditions +xl_bcnd=3 +xu_bcnd=3 +yl_bcnd=0 +yu_bcnd=0 +zl_bcnd=0 +zu_bcnd=0 +# path to output directory +outdir=./ + +################################################# +# Parameters for 1D Riemann problems +# density of left state +rho_l=1.0 +# velocity of left state +vx_l=0.0 +vy_l=0.0 +vz_l=0.0 +# pressure of left state +P_l=1.0 +# density of right state +rho_r=0.1 +# velocity of right state +vx_r=0.0 +vy_r=0.0 +vz_r=0.0 +# pressure of right state +P_r=0.1 +# location of initial discontinuity +diaph=0.5 +# value of gamma +gamma=1.4 + diff --git a/src/system_tests/mhd_system_tests.cpp b/src/system_tests/mhd_system_tests.cpp new file mode 100644 index 000000000..39cec0b89 --- /dev/null +++ b/src/system_tests/mhd_system_tests.cpp @@ -0,0 +1,636 @@ +/*! + * \file mhd_system_tests.cpp + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Contains all the system tests for the MHD build type + * + */ + +// STL includes +#include + +// External Libraries and Headers +#include + +// Local includes +#include "../system_tests/system_tester.h" +#include "../io/io.h" + +// ============================================================================= +// Test Suite: tMHDSYSTEMConstantParameterizedMpi +// ============================================================================= +/*! 
+ * \defgroup tMHDSYSTEMConstantParameterizedMpi + * \brief Test the constant initial conditions as a parameterized test + * with varying numbers of MPI ranks + * + */ +/// @{ +class tMHDSYSTEMConstantParameterizedMpi + :public + ::testing::TestWithParam +{ +protected: + systemTest::SystemTestRunner constantTest; +}; + +// Test with all magnetic fields set to zero +TEST_P(tMHDSYSTEMConstantParameterizedMpi, + ZeroMagneticFieldCorrectInputExpectCorrectOutput) +{ + constantTest.numMpiRanks = GetParam(); + constantTest.runTest(); +} + +// Test with all magnetic fields set to one +TEST_P(tMHDSYSTEMConstantParameterizedMpi, + MagneticFieldCorrectInputExpectCorrectOutput) +{ + constantTest.numMpiRanks = GetParam(); + constantTest.runTest(); +} + +INSTANTIATE_TEST_SUITE_P(, + tMHDSYSTEMConstantParameterizedMpi, + ::testing::Values(1, 2, 4)); +/// @} +// ============================================================================= + +// ============================================================================= +// Test Suite: tMHDSYSTEMLinearWavesParameterizedAngle +// ============================================================================= +/*! + * \defgroup tMHDSYSTEMLinearWavesParameterizedAngle + * \brief Test the linear waves initial conditions as a parameterized test + * with varying angles. 
Details in Gardiner & Stone 2008 + * + */ +/// @{ +class tMHDSYSTEMLinearWavesParameterizedAngle + :public + ::testing::TestWithParam> +{ +public: + tMHDSYSTEMLinearWavesParameterizedAngle() + : waveTest(false, true, false, false){}; +protected: + systemTest::SystemTestRunner waveTest; + + #ifdef PCM + double const allowedL1Error = 4E-7; // Based on results in Gardiner & Stone 2008 + double const allowedError = 4E-7; + #else //PCM + double const allowedL1Error = 1E-7; // Based on results in Gardiner & Stone 2008 + double const allowedError = 1E-7; + #endif //PCM + + void setLaunchParams(double const &waveSpeed, double const &rEigenVec_rho, + double const &rEigenVec_MomentumX, double const &rEigenVec_MomentumY, + double const &rEigenVec_MomentumZ, double const &rEigenVec_E, + double const &rEigenVec_Bx, double const &rEigenVec_By, + double const &rEigenVec_Bz, double const &pitch, + double const &yaw, double const &domain, + int const &domain_direction, double const &vx=0.0) + { + // Constant for all tests + size_t const N = 32; + double const gamma = 5./3.; + double const tOut = 2*domain / waveSpeed; + + // Define vector values + double x_len=domain, y_len=domain, z_len=domain; + int nx=N, ny=N, nz=N; + double vx_rot=vx, vy_rot=0, vz_rot=0; + double Bx_rot=1, By_rot=1.5, Bz_rot=0; + + double rEigenVec_Bx_rot = rEigenVec_Bx; + double rEigenVec_By_rot = rEigenVec_By; + double rEigenVec_Bz_rot = rEigenVec_Bz; + + double rEigenVec_MomentumX_rot = rEigenVec_MomentumX; + double rEigenVec_MomentumY_rot = rEigenVec_MomentumY; + double rEigenVec_MomentumZ_rot = rEigenVec_MomentumZ; + + switch (domain_direction) + { + case 1: + x_len *= 2; + nx *= 2; + break; + case 2: // swap X and Y + y_len *= 2; + ny *= 2; + std::swap(vx_rot, vy_rot); + std::swap(Bx_rot, By_rot); + std::swap(rEigenVec_Bx_rot, rEigenVec_By_rot); + std::swap(rEigenVec_MomentumX_rot, rEigenVec_MomentumY_rot); + break; + case 3: // swap X and Z + z_len *= 2; + nz *= 2; + std::swap(vx_rot, vz_rot); + 
std::swap(Bx_rot, Bz_rot); + std::swap(rEigenVec_Bx_rot, rEigenVec_Bz_rot); + std::swap(rEigenVec_MomentumX_rot, rEigenVec_MomentumZ_rot); + break; + default: + throw std::invalid_argument("Invalid value of domain_direction given to setLaunchParams"); + break; + } + + // Settings + waveTest.chollaLaunchParams.append(" nx=" + to_string_exact(nx)); + waveTest.chollaLaunchParams.append(" ny=" + to_string_exact(ny)); + waveTest.chollaLaunchParams.append(" nz=" + to_string_exact(nz)); + waveTest.chollaLaunchParams.append(" tout=" + to_string_exact(tOut)); + waveTest.chollaLaunchParams.append(" outstep=" + to_string_exact(tOut)); + waveTest.chollaLaunchParams.append(" init=Linear_Wave"); + waveTest.chollaLaunchParams.append(" xmin=0.0"); + waveTest.chollaLaunchParams.append(" ymin=0.0"); + waveTest.chollaLaunchParams.append(" zmin=0.0"); + waveTest.chollaLaunchParams.append(" xlen=" + to_string_exact(x_len)); + waveTest.chollaLaunchParams.append(" ylen=" + to_string_exact(y_len)); + waveTest.chollaLaunchParams.append(" zlen=" + to_string_exact(z_len)); + waveTest.chollaLaunchParams.append(" xl_bcnd=1"); + waveTest.chollaLaunchParams.append(" xu_bcnd=1"); + waveTest.chollaLaunchParams.append(" yl_bcnd=1"); + waveTest.chollaLaunchParams.append(" yu_bcnd=1"); + waveTest.chollaLaunchParams.append(" zl_bcnd=1"); + waveTest.chollaLaunchParams.append(" zu_bcnd=1"); + waveTest.chollaLaunchParams.append(" rho=1.0"); + waveTest.chollaLaunchParams.append(" vx=" + to_string_exact(vx_rot)); + waveTest.chollaLaunchParams.append(" vy=" + to_string_exact(vy_rot)); + waveTest.chollaLaunchParams.append(" vz=" + to_string_exact(vz_rot)); + waveTest.chollaLaunchParams.append(" P=" + to_string_exact(1/gamma)); + waveTest.chollaLaunchParams.append(" Bx=" + to_string_exact(Bx_rot)); + waveTest.chollaLaunchParams.append(" By=" + to_string_exact(By_rot)); + waveTest.chollaLaunchParams.append(" Bz=" + to_string_exact(Bz_rot)); + waveTest.chollaLaunchParams.append(" A='1e-6'"); + 
waveTest.chollaLaunchParams.append(" gamma=" + to_string_exact(gamma)); + waveTest.chollaLaunchParams.append(" rEigenVec_rho=" + to_string_exact(rEigenVec_rho)); + waveTest.chollaLaunchParams.append(" rEigenVec_MomentumX=" + to_string_exact(rEigenVec_MomentumX_rot)); + waveTest.chollaLaunchParams.append(" rEigenVec_MomentumY=" + to_string_exact(rEigenVec_MomentumY_rot)); + waveTest.chollaLaunchParams.append(" rEigenVec_MomentumZ=" + to_string_exact(rEigenVec_MomentumZ_rot)); + waveTest.chollaLaunchParams.append(" rEigenVec_E=" + to_string_exact(rEigenVec_E)); + waveTest.chollaLaunchParams.append(" rEigenVec_Bx=" + to_string_exact(rEigenVec_Bx_rot)); + waveTest.chollaLaunchParams.append(" rEigenVec_By=" + to_string_exact(rEigenVec_By_rot)); + waveTest.chollaLaunchParams.append(" rEigenVec_Bz=" + to_string_exact(rEigenVec_Bz_rot)); + waveTest.chollaLaunchParams.append(" pitch=" + to_string_exact(pitch)); + waveTest.chollaLaunchParams.append(" yaw=" + to_string_exact(yaw)); + } +}; + +// Fast Magnetosonic Waves Moving Left and Right +// ============================================= +TEST_P(tMHDSYSTEMLinearWavesParameterizedAngle, + FastMagnetosonicWaveRightMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 2.; + std::vector const numTimeSteps = {214, 204, 220}; + + double const prefix = 1./(2*std::sqrt(5)); + double const rEigenVec_rho = prefix * 2; + double const rEigenVec_MomentumX = prefix * 4; + double const rEigenVec_MomentumY = prefix * -2; // + for left wave + double const rEigenVec_MomentumZ = prefix * 0; + double const rEigenVec_Bx = prefix * 0; + double const rEigenVec_By = prefix * 4; + double const rEigenVec_Bz = prefix * 0; + double const rEigenVec_E = prefix * 9; + + // Get the test parameters + auto [pitch, yaw, domain, domain_direction] = GetParam(); + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + 
rEigenVec_Bx, rEigenVec_By, rEigenVec_Bz, pitch, yaw, domain, + domain_direction); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps[domain_direction-1]); + + // Check Results + #ifdef PCM + waveTest.runL1ErrorTest(4.2E-7, 5.4E-7); + #else //PCM + waveTest.runL1ErrorTest(allowedL1Error, allowedError); + #endif //PCM +} + +TEST_P(tMHDSYSTEMLinearWavesParameterizedAngle, + FastMagnetosonicWaveLeftMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 2.; + std::vector const numTimeSteps = {214, 204, 220}; + + double const prefix = 1./(2*std::sqrt(5)); + double const rEigenVec_rho = prefix * 2; + double const rEigenVec_MomentumX = prefix * -4; + double const rEigenVec_MomentumY = prefix * 2; + double const rEigenVec_MomentumZ = prefix * 0; + double const rEigenVec_Bx = prefix * 0; + double const rEigenVec_By = prefix * 4; + double const rEigenVec_Bz = prefix * 0; + double const rEigenVec_E = prefix * 9; + + // Get the test parameters + auto [pitch, yaw, domain, domain_direction] = GetParam(); + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + rEigenVec_Bx, rEigenVec_By, rEigenVec_Bz, pitch, yaw, domain, + domain_direction); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps[domain_direction-1]); + + // Check Results + #ifdef PCM + waveTest.runL1ErrorTest(4.2E-7, 5.4E-7); + #else //PCM + waveTest.runL1ErrorTest(allowedL1Error, allowedError); + #endif //PCM +} + +// Slow Magnetosonic Waves Moving Left and Right +// ============================================= +TEST_P(tMHDSYSTEMLinearWavesParameterizedAngle, + SlowMagnetosonicWaveRightMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 0.5; + std::vector const numTimeSteps = {854, 813, 880}; + + double const prefix = 1./(2*std::sqrt(5)); + double const rEigenVec_rho = 
prefix * 4; + double const rEigenVec_MomentumX = prefix * 2; + double const rEigenVec_MomentumY = prefix * 4; + double const rEigenVec_MomentumZ = prefix * 0; + double const rEigenVec_Bx = prefix * 0; + double const rEigenVec_By = prefix * -2; + double const rEigenVec_Bz = prefix * 0; + double const rEigenVec_E = prefix * 3; + + // Get the test parameters + auto [pitch, yaw, domain, domain_direction] = GetParam(); + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + rEigenVec_Bx, rEigenVec_By, rEigenVec_Bz, pitch, yaw, domain, + domain_direction); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps[domain_direction-1]); + + // Check Results + waveTest.runL1ErrorTest(allowedL1Error, allowedError); +} + +TEST_P(tMHDSYSTEMLinearWavesParameterizedAngle, + SlowMagnetosonicWaveLeftMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 0.5; + std::vector const numTimeSteps = {854, 813, 880}; + + double const prefix = 1./(2*std::sqrt(5)); + double const rEigenVec_rho = prefix * 4; + double const rEigenVec_MomentumX = prefix * -2; + double const rEigenVec_MomentumY = prefix * -4; + double const rEigenVec_MomentumZ = prefix * 0; + double const rEigenVec_Bx = prefix * 0; + double const rEigenVec_By = prefix * -2; + double const rEigenVec_Bz = prefix * 0; + double const rEigenVec_E = prefix * 3; + + // Get the test parameters + auto [pitch, yaw, domain, domain_direction] = GetParam(); + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + rEigenVec_Bx, rEigenVec_By, rEigenVec_Bz, pitch, yaw, domain, + domain_direction); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps[domain_direction-1]); + + // Check Results + waveTest.runL1ErrorTest(allowedL1Error, allowedError); +} + 
+// Alfven Waves Moving Left and Right +// ============================================= +TEST_P(tMHDSYSTEMLinearWavesParameterizedAngle, + AlfvenWaveRightMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 1.0; + std::vector const numTimeSteps = {427, 407, 440}; + + double const rEigenVec_rho = 0; + double const rEigenVec_MomentumX = 0; + double const rEigenVec_MomentumY = 0; + double const rEigenVec_MomentumZ = -1; + double const rEigenVec_Bx = 0; + double const rEigenVec_By = 0; + double const rEigenVec_Bz = 1; + double const rEigenVec_E = 0; + + // Get the test parameters + auto [pitch, yaw, domain, domain_direction] = GetParam(); + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + rEigenVec_Bx, rEigenVec_By, rEigenVec_Bz, pitch, yaw, domain, + domain_direction); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps[domain_direction-1]); + + // Check Results + waveTest.runL1ErrorTest(allowedL1Error, allowedError); +} + +TEST_P(tMHDSYSTEMLinearWavesParameterizedAngle, + AlfvenWaveLeftMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 1.0; + std::vector const numTimeSteps = {427, 407, 440}; + + double const rEigenVec_rho = 0; + double const rEigenVec_MomentumX = 0; + double const rEigenVec_MomentumY = 0; + double const rEigenVec_MomentumZ = 1; + double const rEigenVec_Bx = 0; + double const rEigenVec_By = 0; + double const rEigenVec_Bz = 1; + double const rEigenVec_E = 0; + + // Get the test parameters + auto [pitch, yaw, domain, domain_direction] = GetParam(); + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + rEigenVec_Bx, rEigenVec_By, rEigenVec_Bz, pitch, yaw, domain, + domain_direction); + + // Set the number of timesteps + 
waveTest.setFiducialNumTimeSteps(numTimeSteps[domain_direction-1]); + + // Check Results + waveTest.runL1ErrorTest(allowedL1Error, allowedError); +} + +// Contact Wave Moving Right +// =================================== +TEST_P(tMHDSYSTEMLinearWavesParameterizedAngle, + MHDContactWaveCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 1.0; + std::vector const numTimeSteps = {641, 620, 654}; + + double const rEigenVec_rho = 1; + double const rEigenVec_MomentumX = 1; + double const rEigenVec_MomentumY = 0; + double const rEigenVec_MomentumZ = 0; + double const rEigenVec_Bx = 0; + double const rEigenVec_By = 0; + double const rEigenVec_Bz = 0; + double const rEigenVec_E = 0.5; + double const velocityX = waveSpeed; + + // Get the test parameters + auto [pitch, yaw, domain, domain_direction] = GetParam(); + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + rEigenVec_Bx, rEigenVec_By, rEigenVec_Bz, pitch, yaw, domain, + domain_direction, velocityX); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps[domain_direction-1]); + + // Check Results + #ifdef PCM + waveTest.runL1ErrorTest(1.35*allowedL1Error, 1.35*allowedError); + #else //PCM + waveTest.runL1ErrorTest(allowedL1Error, allowedError); + #endif //PCM +} + +INSTANTIATE_TEST_SUITE_P(, + tMHDSYSTEMLinearWavesParameterizedAngle, + ::testing::Values( + std::make_tuple(0.0*M_PI, 0.0*M_PI, 0.5, 1), + std::make_tuple(0.0*M_PI, 0.5*M_PI, 0.5, 2), + std::make_tuple(0.5*M_PI, 0.0*M_PI, 0.5, 3) + //std::make_tuple(std::asin(2./3.), std::asin(2./std::sqrt(5.)), 1.5, 1) + )); +/// @} +// ============================================================================= + +// ============================================================================= +// Test Suite: tMHDSYSTEMSodShockTube +// TODO: This is temporary. 
Remove once PPMP is implemented for MHD and replace +// with the hydro sod test +// ============================================================================= +/*! + * \defgroup tMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput + * \brief Test the Sod Shock tube initial conditions as a parameterized test + * with varying numbers of MPI ranks + * + */ +/// @{ +class tMHDSYSTEMSodShockTubeParameterizedMpi + :public + ::testing::TestWithParam +{ +protected: + systemTest::SystemTestRunner sodTest; +}; + +TEST_P(tMHDSYSTEMSodShockTubeParameterizedMpi, + CorrectInputExpectCorrectOutput) +{ + sodTest.numMpiRanks = GetParam(); + sodTest.runTest(); +} + +INSTANTIATE_TEST_SUITE_P(CorrectInputExpectCorrectOutput, + tMHDSYSTEMSodShockTubeParameterizedMpi, + ::testing::Values(1, 2, 4)); +/// @} +// ============================================================================= + +// ============================================================================= +// Test Suite: tMHDSYSTEMEinfeldtStrongRarefaction +// ============================================================================= +TEST(tMHDSYSTEMEinfeldtStrongRarefaction, + CorrectInputExpectCorrectOutput) +{ + systemTest::SystemTestRunner rarefactionTest; + rarefactionTest.runTest(); +} +// ============================================================================= + +// ============================================================================= +// Test Suite: tMHDSYSTEMLinearWavesParameterizedMpi +// ============================================================================= +/*! + * \defgroup tMHDSYSTEMLinearWavesParameterizedMpi + * \brief Test the linear waves initial conditions as a parameterized test + * with varying numbers of MPI ranks. 
Details in Gardiner & Stone 2008 + * + */ +/// @{ +class tMHDSYSTEMLinearWavesParameterizedMpi + :public + ::testing::TestWithParam +{ +public: + tMHDSYSTEMLinearWavesParameterizedMpi() + : waveTest(false, true, false, false){}; +protected: + systemTest::SystemTestRunner waveTest; + + #ifdef PCM + double const allowedL1Error = 4E-7; // Based on results in Gardiner & Stone 2008 + double const allowedError = 4E-7; + #else //PCM + double const allowedL1Error = 1E-7; // Based on results in Gardiner & Stone 2008 + double const allowedError = 1E-7; + #endif //PCM + + void setLaunchParams(double const &waveSpeed, double const &rEigenVec_rho, + double const &rEigenVec_MomentumX, double const &rEigenVec_MomentumY, + double const &rEigenVec_MomentumZ, double const &rEigenVec_E, + double const &rEigenVec_Bx, double const &rEigenVec_By, + double const &rEigenVec_Bz) + { + // Constant for all tests + size_t const N = 32; + double const gamma = 5./3.; + double const domain = 0.5; + double const tOut = 2*domain / waveSpeed; + + // Settings + waveTest.chollaLaunchParams.append(" nx=" + to_string_exact(2*N)); + waveTest.chollaLaunchParams.append(" ny=" + to_string_exact(N)); + waveTest.chollaLaunchParams.append(" nz=" + to_string_exact(N)); + waveTest.chollaLaunchParams.append(" tout=" + to_string_exact(tOut)); + waveTest.chollaLaunchParams.append(" outstep=" + to_string_exact(tOut)); + waveTest.chollaLaunchParams.append(" init=Linear_Wave"); + waveTest.chollaLaunchParams.append(" xmin=0.0"); + waveTest.chollaLaunchParams.append(" ymin=0.0"); + waveTest.chollaLaunchParams.append(" zmin=0.0"); + waveTest.chollaLaunchParams.append(" xlen=" + to_string_exact(2*domain)); + waveTest.chollaLaunchParams.append(" ylen=" + to_string_exact(domain)); + waveTest.chollaLaunchParams.append(" zlen=" + to_string_exact(domain)); + waveTest.chollaLaunchParams.append(" xl_bcnd=1"); + waveTest.chollaLaunchParams.append(" xu_bcnd=1"); + waveTest.chollaLaunchParams.append(" yl_bcnd=1"); + 
waveTest.chollaLaunchParams.append(" yu_bcnd=1"); + waveTest.chollaLaunchParams.append(" zl_bcnd=1"); + waveTest.chollaLaunchParams.append(" zu_bcnd=1"); + waveTest.chollaLaunchParams.append(" rho=1.0"); + waveTest.chollaLaunchParams.append(" vx=0"); + waveTest.chollaLaunchParams.append(" vy=0"); + waveTest.chollaLaunchParams.append(" vz=0"); + waveTest.chollaLaunchParams.append(" P=" + to_string_exact(1/gamma)); + waveTest.chollaLaunchParams.append(" Bx=1"); + waveTest.chollaLaunchParams.append(" By=1.5"); + waveTest.chollaLaunchParams.append(" Bz=0"); + waveTest.chollaLaunchParams.append(" A='1e-6'"); + waveTest.chollaLaunchParams.append(" gamma=" + to_string_exact(gamma)); + waveTest.chollaLaunchParams.append(" rEigenVec_rho=" + to_string_exact(rEigenVec_rho)); + waveTest.chollaLaunchParams.append(" rEigenVec_MomentumX=" + to_string_exact(rEigenVec_MomentumX)); + waveTest.chollaLaunchParams.append(" rEigenVec_MomentumY=" + to_string_exact(rEigenVec_MomentumY)); + waveTest.chollaLaunchParams.append(" rEigenVec_MomentumZ=" + to_string_exact(rEigenVec_MomentumZ)); + waveTest.chollaLaunchParams.append(" rEigenVec_E=" + to_string_exact(rEigenVec_E)); + waveTest.chollaLaunchParams.append(" rEigenVec_Bx=" + to_string_exact(rEigenVec_Bx)); + waveTest.chollaLaunchParams.append(" rEigenVec_By=" + to_string_exact(rEigenVec_By)); + waveTest.chollaLaunchParams.append(" rEigenVec_Bz=" + to_string_exact(rEigenVec_Bz)); + } +}; + +// Slow Magnetosonic Waves Moving Left and Right +// ============================================= +TEST_P(tMHDSYSTEMLinearWavesParameterizedMpi, + SlowMagnetosonicWaveRightMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 0.5; + int const numTimeSteps = 854; + + double const prefix = 1./(2*std::sqrt(5)); + double const rEigenVec_rho = prefix * 4; + double const rEigenVec_MomentumX = prefix * 2; + double const rEigenVec_MomentumY = prefix * 4; + double const rEigenVec_MomentumZ = prefix * 0; + double const 
rEigenVec_Bx = prefix * 0; + double const rEigenVec_By = prefix * -2; + double const rEigenVec_Bz = prefix * 0; + double const rEigenVec_E = prefix * 3; + + // Get the test parameters + waveTest.numMpiRanks = GetParam(); + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + rEigenVec_Bx, rEigenVec_By, rEigenVec_Bz); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps); + + // Check Results + waveTest.runL1ErrorTest(allowedL1Error, allowedError); +} + +TEST_P(tMHDSYSTEMLinearWavesParameterizedMpi, + SlowMagnetosonicWaveLeftMovingCorrectInputExpectCorrectOutput) +{ + // Specific to this test + double const waveSpeed = 0.5; + int const numTimeSteps = 854; + + double const prefix = 1./(2*std::sqrt(5)); + double const rEigenVec_rho = prefix * 4; + double const rEigenVec_MomentumX = prefix * -2; + double const rEigenVec_MomentumY = prefix * -4; + double const rEigenVec_MomentumZ = prefix * 0; + double const rEigenVec_Bx = prefix * 0; + double const rEigenVec_By = prefix * -2; + double const rEigenVec_Bz = prefix * 0; + double const rEigenVec_E = prefix * 3; + + // Get the test parameters + waveTest.numMpiRanks = GetParam(); + + // Set the launch parameters + setLaunchParams(waveSpeed, rEigenVec_rho, rEigenVec_MomentumX, + rEigenVec_MomentumY, rEigenVec_MomentumZ, rEigenVec_E, + rEigenVec_Bx, rEigenVec_By, rEigenVec_Bz); + + // Set the number of timesteps + waveTest.setFiducialNumTimeSteps(numTimeSteps); + + // Check Results + waveTest.runL1ErrorTest(allowedL1Error, allowedError); +} + +INSTANTIATE_TEST_SUITE_P(, + tMHDSYSTEMLinearWavesParameterizedMpi, + ::testing::Values(1, 2, 4)); +/// @} +// ============================================================================= \ No newline at end of file diff --git a/src/system_tests/system_tester.cpp b/src/system_tests/system_tester.cpp index c59e6e770..a2835ce7c 100644 --- 
a/src/system_tests/system_tester.cpp +++ b/src/system_tests/system_tester.cpp @@ -21,6 +21,7 @@ // Local includes #include "../system_tests/system_tester.h" // Include the header file #include "../utils/testing_utilities.h" +#include "../io/io.h" // ============================================================================= // Public Members @@ -154,8 +155,7 @@ void systemTest::SystemTestRunner::runTest() else { // This is a field data set - testData = loadTestFieldData(dataSetName, - testDims); + testData = loadTestFieldData(dataSetName, testDims); // Get fiducial data fiducialData = _loadFiducialFieldData(dataSetName); } @@ -178,14 +178,11 @@ void systemTest::SystemTestRunner::runTest() // Check for equality and iff not equal return difference double absoluteDiff; int64_t ulpsDiff; - // Fixed epsilon is changed from the default since AMD/Clang - // appear to differ from NVIDIA/GCC/XL by roughly 1E-12 - double fixedEpsilon = 5.0E-12; bool areEqual = testingUtilities::nearlyEqualDbl(fiducialData.at(index), testData.at(index), absoluteDiff, ulpsDiff, - fixedEpsilon); + _fixedEpsilon); ASSERT_TRUE(areEqual) << std::endl << "Difference in " @@ -203,6 +200,136 @@ void systemTest::SystemTestRunner::runTest() } // ============================================================================= +// ============================================================================= +void systemTest::SystemTestRunner::runL1ErrorTest(double const &maxAllowedL1Error, + double const &maxAllowedError) +{ + /// Only run if this variable is set to `true`. Generally this and + /// globalCompareSystemTestResults should only be used for large MPI / tests + /// where the user wishes to separate the execution of cholla and the / + /// comparison of results onto different machines/jobs + if (globalRunCholla) + { + // Launch Cholla. Note that this dumps all console output to the console + // log file as requested by the user. 
+ launchCholla(); + } + + // Check that there is hydro data and no particle data + if (_particleDataExists) + { + std::string errMessage = "Error: SystemTestRunner::runL1ErrorTest does not support particles"; + throw std::runtime_error(errMessage); + } + if (not _hydroDataExists) + { + std::string errMessage = "Error: SystemTestRunner::runL1ErrorTest requires hydro data"; + throw std::runtime_error(errMessage); + } + + /// If set to false then no comparison will be performed. Generally this and + /// globalRunCholla should only be used for large MPI tests where the user + /// wishes to separate the execution of cholla and the comparison of results + /// onto different machines/jobs + if (not globalCompareSystemTestResults) return; + + // Make sure we have all the required data files and open the data files + _testHydroFieldsFileVec.resize(numMpiRanks); + std::vector initialHydroFieldsFileVec(numMpiRanks); + for (size_t fileIndex = 0; fileIndex < numMpiRanks; fileIndex++) + { + // Initial time data + std::string fileName = "/0.h5." + std::to_string(fileIndex); + _checkFileExists(_outputDirectory + fileName); + initialHydroFieldsFileVec[fileIndex].openFile(_outputDirectory + fileName, + H5F_ACC_RDONLY); + + // Final time data + fileName = "/1.h5." + std::to_string(fileIndex); + _checkFileExists(_outputDirectory + fileName); + _testHydroFieldsFileVec[fileIndex].openFile(_outputDirectory + fileName, + H5F_ACC_RDONLY); + } + + // Get the list of test dataset names + _fiducialDataSetNames = _findDataSetNames(initialHydroFieldsFileVec[0]); + _testDataSetNames = _findDataSetNames(_testHydroFieldsFileVec[0]); + + // Start Performing Checks + // ======================= + // Check the number of time steps + if (_compareNumTimeSteps) _checkNumTimeSteps(); + + // Check that the test file has as many, or more, datasets than the fiducial + // file. 
Provide a warning if the datasets are not the same size + EXPECT_GE(_testDataSetNames.size(), _fiducialDataSetNames.size()) + << std::endl + << "Warning: The test data has " + << _testDataSetNames.size() + << " datasets and the fiducial data has " + << _fiducialDataSetNames.size() + << " datasets" << std::endl << std::endl; + + // Loop over the datasets to be tested + double L2Norm = 0; + double maxError = 0; + for (auto dataSetName: _fiducialDataSetNames) + { + if (dataSetName == "GasEnergy") + { + continue; + } + + // check that the test data has the dataset in it + ASSERT_EQ(std::count(_testDataSetNames.begin(), _testDataSetNames.end(), dataSetName), 1) + << "The test data does not contain the dataset '" + dataSetName + + "' or contains it more than once."; + + // Get data vectors + std::vector initialDims(3,1); + std::vector initialData; + std::vector finalDims(3,1); + std::vector finalData; + + // This is a field data set + initialData = loadTestFieldData(dataSetName, initialDims, initialHydroFieldsFileVec); + // Get fiducial data + finalData = loadTestFieldData(dataSetName, finalDims, _testHydroFieldsFileVec); + + // Check that they're the same length + ASSERT_EQ(initialData.size(), finalData.size()) + << "The initial and final '" + << dataSetName + << "' datasets are not the same length"; + + // Compute the L1 Error. + double L1Error = 0; + for (size_t i = 0; i < initialData.size(); i++) + { + double const diff = std::abs(initialData.at(i) - finalData.at(i)); + L1Error += diff; + maxError = (diff > maxError)? 
diff: maxError; + } + + L1Error *= (1./static_cast(initialDims[0]*initialDims[1]*initialDims[2])); + L2Norm += L1Error * L1Error; + + // Perform the correctness check + EXPECT_LT(L1Error, maxAllowedL1Error) << "the L1 error for the " + << dataSetName + << " data has exceeded the allowed value"; + } + + // Check the L1 Norm + L2Norm = std::sqrt(L2Norm); + EXPECT_LT(L2Norm, maxAllowedL1Error) + << "the norm of the L1 error vector has exceeded the allowed value"; + + // Check the Max Error + EXPECT_LT(maxError, maxAllowedError) << "The maximum error has exceeded the allowed value"; +} +// ============================================================================= + // ============================================================================= void systemTest::SystemTestRunner::launchCholla() { @@ -250,11 +377,11 @@ void systemTest::SystemTestRunner::setFiducialData(std::string const &fieldName, std::vector const &dataVec) { // First check if there's a fiducial data file - if (_fiducialFileExists) + if (_fiducialDataSets.count(fieldName) > 0) { - std::string errMessage = "Error: Fiducial data file already exists for test '" - + _fullTestFileName - + "' and cannot be overwritten."; + std::string errMessage = "Error: Fiducial dataset for field '" + + fieldName + + "' already exists and cannot be overwritten"; throw std::runtime_error(errMessage); } @@ -333,17 +460,41 @@ systemTest::SystemTestRunner::SystemTestRunner(bool const &particleData, _fullTestFileName = fullTestName.substr(0, fullTestName.find("/")); // Generate the input paths. Strip out everything after a "/" since that - // probably indicates a parameterized test + // probably indicates a parameterized test. Also, check that the files exist + // and load fiducial HDF5 file if required _chollaPath = ::globalChollaRoot.getString() + "/bin/cholla." + ::globalChollaBuild.getString() + "." 
+ ::globalChollaMachine.getString(); - _chollaSettingsPath = ::globalChollaRoot.getString() - + "/src/system_tests/input_files/" - + _fullTestFileName + ".txt"; + _checkFileExists(_chollaPath); + if (useSettingsFile) + { + _chollaSettingsPath = ::globalChollaRoot.getString() + + "/src/system_tests/input_files/" + + _fullTestFileName + ".txt"; + _checkFileExists(_chollaSettingsPath); + } + else + { + _chollaSettingsPath = ::globalChollaRoot.getString() + + "/src/system_tests/input_files/" + + "blank_settings_file.txt"; + _checkFileExists(_chollaSettingsPath); + } + if (useFiducialFile) + { _fiducialFilePath = ::globalChollaRoot.getString() + "/cholla-tests-data/system_tests/" + _fullTestFileName + ".h5"; + _checkFileExists(_fiducialFilePath); + _fiducialFile.openFile(_fiducialFilePath, H5F_ACC_RDONLY); + _fiducialDataSetNames = _findDataSetNames(_fiducialFile); + _fiducialFileExists = true; + } + else + { + _fiducialFilePath = ""; + } // Generate output paths, these files don't exist yet _outputDirectory = ::globalChollaRoot.getString() + "/bin/" + fullTestName; @@ -360,17 +511,6 @@ systemTest::SystemTestRunner::SystemTestRunner(bool const &particleData, + "' either already exists or could not be created." 
<< std::endl; } - - // Check that the files exist and load fiducial HDF5 file if required - _checkFileExists(_chollaPath); - if (useSettingsFile) _checkFileExists(_chollaSettingsPath); - if (useFiducialFile) - { - _checkFileExists(_fiducialFilePath); - _fiducialFile.openFile(_fiducialFilePath, H5F_ACC_RDONLY); - _fiducialDataSetNames = _findDataSetNames(_fiducialFile); - _fiducialFileExists = true; - }; } // ============================================================================= @@ -463,22 +603,25 @@ void systemTest::SystemTestRunner::_checkNumTimeSteps() // ============================================================================= std::vector systemTest::SystemTestRunner::loadTestFieldData( std::string dataSetName, - std::vector &testDims) + std::vector &testDims, + std::vector file) { - // Get the file we're using - std::vector file; + // Switch which fileset we're using if it's a particle dataset if (dataSetName == "particle_density") { file = _testParticlesFileVec; dataSetName = "density"; } - else + else if (file.size() == 0) { file = _testHydroFieldsFileVec; } - // Get the size of each dimension - H5::Attribute dimensions = file[0].openAttribute("dims"); + // Get the size of each dimension. First check if the field is a magnetic + // field or not to make sure we're retreiving the right dimensions + std::string dimsName = (dataSetName.find("magnetic") != std::string::npos)? + "magnetic_field_dims": "dims"; + H5::Attribute dimensions = file[0].openAttribute(dimsName.c_str()); dimensions.read(H5::PredType::NATIVE_ULONG, testDims.data()); // Allocate the vector @@ -510,7 +653,9 @@ std::vector systemTest::SystemTestRunner::loadTestFieldData( // Get dims_local std::vector dimsLocal(3,1); - H5::Attribute dimsLocalAttr = file[rank].openAttribute("dims_local"); + std::string dimsNameLocal = (dataSetName.find("magnetic") != std::string::npos)? 
+ "magnetic_field_dims_local": "dims_local"; + H5::Attribute dimsLocalAttr = file[rank].openAttribute(dimsNameLocal.c_str()); dimsLocalAttr.read(H5::PredType::NATIVE_INT, dimsLocal.data()); // Now we add the data to the larger vector diff --git a/src/system_tests/system_tester.h b/src/system_tests/system_tester.h index 6d5aa1925..29b8b74d0 100644 --- a/src/system_tests/system_tester.h +++ b/src/system_tests/system_tester.h @@ -72,9 +72,24 @@ class systemTest::SystemTestRunner */ void runTest(); + /*! + * \brief Compute the L1 error for each field compared to the initial + * conditions. Doesn't work with particle data + * + * \param[in] maxAllowedL1Error The maximum allowed L1 error for this test + * \param[in] maxAllowedError The maximum allowed for any value in the test + * + */ + void runL1ErrorTest(double const &maxAllowedL1Error, double const &maxAllowedError=1E-7); + + /*! + * \brief Launch Cholla as it is set up + * + */ void launchCholla(); void openHydroTestData(); + /*! * \brief Get the Cholla Path object * @@ -128,6 +143,13 @@ class systemTest::SystemTestRunner */ std::vector getDataSetsToTest(){return _fiducialDataSetNames;}; + /*! + * \brief Set the Fixed Epsilon value + * + * \param[in] newVal The new value of fixed epsilon + */ + void setFixedEpsilon(double const &newVal){_fixedEpsilon = newVal;}; + /*! * \brief Choose which datasets to test. By default it tests all the * datasets in the fiducial data. A warning will be thrown if not all the @@ -193,10 +215,12 @@ class systemTest::SystemTestRunner * * \param[in] dataSetName The name of the dataset to get * \param[out] testDims An vector with the length of each dimension in it + * \param[in] file (optional) The vector of HDF5 files to load * \return std::vector A vector containing the data */ std::vector loadTestFieldData(std::string dataSetName, - std::vector &testDims); + std::vector &testDims, + std::vector file={}); /*! 
* \brief Generate a std::vector of the specified size populated by a sine @@ -241,7 +265,7 @@ class systemTest::SystemTestRunner * \param[in] useSettingsFile Indicate if you're using a settings file. If * `true` then the settings file is automatically found based on the naming * convention. If false then the user MUST provide all the required settings - * with the SystemTestRunner::setChollaLaunchParams method + * with the SystemTestRunner::chollaLaunchParams member variable */ SystemTestRunner(bool const &particleData=false, bool const &hydroData=true, @@ -290,6 +314,10 @@ class systemTest::SystemTestRunner /// The total number of particles in the fiducial dataset size_t _fiducialTotalNumParticles=0; + /// Fixed epsilon is changed from the default since AMD/Clang + /// appear to differ from NVIDIA/GCC/XL by roughly 1E-12 + double _fixedEpsilon = 5.0E-12; + /// Flag to indicate if a fiducial HDF5 data file is being used or a /// programmatically generated H5File object. `true` = use a file, `false` = /// use generated H5File object diff --git a/src/utils/DeviceVector.h b/src/utils/DeviceVector.h index 422f3d151..ca0cacba8 100644 --- a/src/utils/DeviceVector.h +++ b/src/utils/DeviceVector.h @@ -1,5 +1,5 @@ /*! - * \file device_vector.h + * \file DeviceVector.h * \author Robert 'Bob' Caddy (rvc@pitt.edu) * \brief Contains the declartion and implementation of the DeviceVector * class. Note that since this is a templated class the implementation must be @@ -48,8 +48,10 @@ namespace cuda_utilities * * \param[in] size The number of elements desired in the array. Can be * any positive integer. + * \param[in] initialize (optional) If true then initialize the GPU + * memory to int(0) */ - DeviceVector(size_t const size) {_allocate(size);} + DeviceVector(size_t const size, bool const initialize=false); /*! 
* \brief Destroy the Device Vector object by calling the `_deAllocate` @@ -178,7 +180,7 @@ namespace cuda_utilities void _allocate(size_t const size) { _size=size; - CudaSafeCall(cudaMalloc(&_ptr, size*sizeof(T))); + CudaSafeCall(cudaMalloc(&_ptr, _size*sizeof(T))); } /*! @@ -198,11 +200,23 @@ namespace cuda_utilities // ============================================================================= namespace cuda_utilities { - // ========================================================================= // Public Methods // ========================================================================= + // ========================================================================= + template + DeviceVector::DeviceVector(size_t const size, bool const initialize) + { + _allocate(size); + + if (initialize) + { + CudaSafeCall(cudaMemset(_ptr, 0, _size*sizeof(T))); + } + } + // ========================================================================= + // ========================================================================= template void DeviceVector::resize(size_t const newSize) diff --git a/src/utils/DeviceVector_tests.cu b/src/utils/DeviceVector_tests.cu index 26a63dbca..3db21baee 100644 --- a/src/utils/DeviceVector_tests.cu +++ b/src/utils/DeviceVector_tests.cu @@ -1,5 +1,5 @@ /*! 
- * \file device_vector_tests.cu + * \file DeviceVector_tests.cu * \author Robert 'Bob' Caddy (rvc@pitt.edu) * \brief Tests for the DeviceVector class * @@ -81,7 +81,7 @@ TEST(tALLDeviceVectorDestructor, // Get the pointer information cudaPointerAttributes ptrAttributes; - CudaSafeCall(cudaPointerGetAttributes(&ptrAttributes, devVector.data())); + cudaPointerGetAttributes(&ptrAttributes, devVector.data()); // Warning strings std::string typeMessage = "ptrAttributes.type should be 0 since " @@ -106,6 +106,9 @@ TEST(tALLDeviceVectorDestructor, #endif // O_HIP EXPECT_EQ(nullptr, ptrAttributes.devicePointer) << devPtrMessage; EXPECT_EQ(nullptr, ptrAttributes.hostPointer) << hostPtrMessage; + + // Reconstruct DeviceVector object to avoid error + new (&devVector) cuda_utilities::DeviceVector{vectorSize}; } TEST(tALLDeviceVectorStdVectorHostToDeviceCopyAndIndexing, diff --git a/src/utils/cuda_utilities.h b/src/utils/cuda_utilities.h index 9c07a95a6..3f0ae5fba 100644 --- a/src/utils/cuda_utilities.h +++ b/src/utils/cuda_utilities.h @@ -12,7 +12,6 @@ #include "../global/global_cuda.h" #include "../utils/gpu.hpp" - namespace cuda_utilities { /*! @@ -75,25 +74,61 @@ namespace cuda_utilities } } - // ========================================================================= /*! - * \brief Set the value that `pointer` points at in GPU memory to `value`. - * This only sets the first value in memory so if `pointer` points to an - * array then only `pointer[0]` will be set; i.e. 
this effectively does - * `pointer = &value` - * - * \tparam T Any scalar type - * \param[in] pointer The location in GPU memory - * \param[in] value The value to set `*pointer` to - */ - template - void setScalarDeviceMemory(T *pointer, T const value) + * \brief Initialize GPU memory + * + * \param[in] ptr The pointer to GPU memory + * \param[in] N The size of the array in bytes + */ + inline void initGpuMemory(Real *ptr, size_t N) { - CudaSafeCall( - cudaMemcpy(pointer, // destination - &value, // source - sizeof(T), - cudaMemcpyHostToDevice)); + CudaSafeCall(cudaMemset(ptr, 0, N)); } - // ========================================================================= -} \ No newline at end of file + + // ===================================================================== + /*! + * \brief Struct to determine the optimal number of blocks and threads + * per block to use when launching a kernel. The member + * variables are `threadsPerBlock` and `numBlocks` which are chosen with + the occupancy API. Can target any device on the system through the + * optional constructor argument. + * NOTE: On AMD there's currently an issue that stops kernels from being + * passed. As a workaround for now this struct just returns the maximum + * number of blocks and threads per block that a MI250X can run at once. + * + */ + template + struct AutomaticLaunchParams + { + public: + /*! + * \brief Construct a new Reduction Launch Params object. By default it + * generates values of numBlocks and threadsPerBlock suitable for a + * kernel with a grid-stride loop. 
For a kernel with one thread per + * element set the optional `numElements` argument to the number of + * elements + * + * \param[in] kernel The kernel to determine the launch parameters for + * \param[in] numElements The number of elements in the array that + the kernel operates on + */ + AutomaticLaunchParams(T &kernel, size_t numElements=0) + { + cudaOccupancyMaxPotentialBlockSize(&numBlocks, &threadsPerBlock, kernel, 0, 0); + + if (numElements > 0) + { + numBlocks = (numElements + threadsPerBlock - 1) / threadsPerBlock; + } + } + + /// Defaulted Destructor + ~AutomaticLaunchParams()=default; + + /// The maximum number of threads per block that the device supports + int threadsPerBlock; + /// The maximum number of scheduleable blocks on the device + int numBlocks; + }; + // ===================================================================== +} // end namespace cuda_utilities diff --git a/src/utils/cuda_utilities_tests.cpp b/src/utils/cuda_utilities_tests.cpp index ddefebfd7..dc2f20066 100644 --- a/src/utils/cuda_utilities_tests.cpp +++ b/src/utils/cuda_utilities_tests.cpp @@ -120,23 +120,3 @@ TEST(tALLCompute1DIndex, EXPECT_EQ(fiducialId, testId); } // ============================================================================= - -// ============================================================================= -TEST(tALLSetScalarDeviceMemory, - TypeDoubleInputExpectCorrectValueSet) -{ - double value = 173.246; - double *dev_ptr, host_val; - CudaSafeCall(cudaMalloc(&dev_ptr, sizeof(double))); - - cuda_utilities::setScalarDeviceMemory(dev_ptr, value); - - CudaSafeCall( - cudaMemcpy(&host_val, // destination - dev_ptr, // source - sizeof(double), - cudaMemcpyDeviceToHost)); - - EXPECT_EQ(value, host_val); -} -// ============================================================================= diff --git a/src/utils/gpu.hpp b/src/utils/gpu.hpp index 4c285965e..66f2885f2 100644 --- a/src/utils/gpu.hpp +++ b/src/utils/gpu.hpp @@ -20,7 +20,7 @@ static void 
__attribute__((unused)) check(const hipfftResult err, const char *co exit(err); } -#endif // PARIS PARIC_GALACTIC +#endif //CUFFT PARIS PARIS_GALACTIC #define WARPSIZE 64 static constexpr int maxWarpsPerBlock = 1024/WARPSIZE; @@ -53,6 +53,7 @@ static constexpr int maxWarpsPerBlock = 1024/WARPSIZE; #define cudaMemcpy hipMemcpy #define cudaMemcpyAsync hipMemcpyAsync #define cudaMemcpyPeer hipMemcpyPeer +#define cudaMemcpyPeer hipMemcpyPeer #define cudaMemcpyDeviceToHost hipMemcpyDeviceToHost #define cudaMemcpyDeviceToDevice hipMemcpyDeviceToDevice #define cudaMemcpyHostToDevice hipMemcpyHostToDevice @@ -65,10 +66,11 @@ static constexpr int maxWarpsPerBlock = 1024/WARPSIZE; #define cudaGetDeviceProperties hipGetDeviceProperties #define cudaPointerAttributes hipPointerAttribute_t #define cudaPointerGetAttributes hipPointerGetAttributes +#define cudaOccupancyMaxPotentialBlockSize hipOccupancyMaxPotentialBlockSize // Texture definitions #define cudaArray hipArray -#define cudaMallocArray hipMallocArray +#define cudaMallocArray hipMallocArray #define cudaFreeArray hipFreeArray #define cudaMemcpyToArray hipMemcpyToArray #define cudaMemcpy2DToArray hipMemcpy2DToArray @@ -87,8 +89,10 @@ static constexpr int maxWarpsPerBlock = 1024/WARPSIZE; #define cudaTextureDesc hipTextureDesc #define cudaAddressModeClamp hipAddressModeClamp #define cudaFilterModeLinear hipFilterModeLinear -#define cudaFilterModePoint hipFilterModePoint +#define cudaFilterModePoint hipFilterModePoint // Texture Definitions +#define cudaPointerAttributes hipPointerAttribute_t +#define cudaPointerGetAttributes hipPointerGetAttributes // FFT definitions #define cufftDestroy hipfftDestroy diff --git a/src/utils/hydro_utilities.h b/src/utils/hydro_utilities.h index 990eb2a83..b89175835 100644 --- a/src/utils/hydro_utilities.h +++ b/src/utils/hydro_utilities.h @@ -71,6 +71,40 @@ namespace hydro_utilities { return P; } + /*! 
+ * \brief Compute the kinetic energy from the density and velocities + * + * \param[in] d The density + * \param[in] vx The x velocity + * \param[in] vy The y velocity + * \param[in] vz The z velocity + * \return Real The kinetic energy + */ + inline __host__ __device__ Real Calc_Kinetic_Energy_From_Velocity(Real const &d, + Real const &vx, + Real const &vy, + Real const &vz) + { + return 0.5 * d * (vx*vx + vy*vy * vz*vz); + } + + /*! + * \brief Compute the kinetic energy from the density and momenta + * + * \param[in] d The density + * \param[in] mx The x momentum + * \param[in] my The y momentum + * \param[in] mz The z momentum + * \return Real The kinetic energy + */ + inline __host__ __device__ Real Calc_Kinetic_Energy_From_Momentum(Real const &d, + Real const &mx, + Real const &my, + Real const &mz) + { + return (0.5 / d) * (mx*mx + my*my * mz*mz); + } + inline __host__ __device__ Real Calc_Sound_Speed(Real const &E, Real const &d, Real const &mx, Real const &my, Real const &mz, Real const &gamma) { Real P = Calc_Pressure_Conserved(E, d, mx, my, mz, gamma); return sqrt(gamma * P / d); diff --git a/src/utils/hydro_utilities_tests.cpp b/src/utils/hydro_utilities_tests.cpp index e8a066d12..e0e3cf455 100644 --- a/src/utils/hydro_utilities_tests.cpp +++ b/src/utils/hydro_utilities_tests.cpp @@ -127,3 +127,45 @@ TEST(tHYDROHydroUtilsGetPressureFromDE, CorrectInputExpectCorrectOutput) { testingUtilities::checkResults(fiducial_Ps.at(i), test_Ps, parameters.names.at(i)); } } + +TEST(tHYDROtMHDCalcKineticEnergyFromVelocity, CorrectInputExpectCorrectOutput) { + TestParams parameters; + std::vector fiducialEnergies{0.0, + 6.307524975350106e-145, + 7.3762470327090601e+249}; + double const coef = 1E-50; + + for (size_t i = 0; i < parameters.names.size(); i++) + { + Real testEnergy = hydro_utilities::Calc_Kinetic_Energy_From_Velocity( + coef*parameters.d.at(i), + coef*parameters.vx.at(i), + coef*parameters.vy.at(i), + coef*parameters.vz.at(i)); + + 
testingUtilities::checkResults(fiducialEnergies.at(i), + testEnergy, + parameters.names.at(i)); + } +} + +TEST(tHYDROtMHDCalcKineticEnergyFromMomentum, CorrectInputExpectCorrectOutput) { + TestParams parameters; + std::vector fiducialEnergies{0.0, + 0.0, + 7.2568536478335773e+147}; + double const coef = 1E-50; + + for (size_t i = 0; i < parameters.names.size(); i++) + { + Real testEnergy = hydro_utilities::Calc_Kinetic_Energy_From_Momentum( + coef*parameters.d.at(i), + coef*parameters.mx.at(i), + coef*parameters.my.at(i), + coef*parameters.mz.at(i)); + + testingUtilities::checkResults(fiducialEnergies.at(i), + testEnergy, + parameters.names.at(i)); + } +} \ No newline at end of file diff --git a/src/utils/math_utilities.h b/src/utils/math_utilities.h new file mode 100644 index 000000000..735cec996 --- /dev/null +++ b/src/utils/math_utilities.h @@ -0,0 +1,92 @@ +/*! + * \file math_utilities.h + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Contains various functions for common mathematical operations + * + */ + +#pragma once + +// STL Includes +#include +#include + +// External Includes + +// Local Includes +#include "../global/global.h" +#include "../global/global_cuda.h" +#include "../utils/gpu.hpp" + +namespace math_utils +{ + // ========================================================================= + /*! + * \brief Rotate cartesian coordinates. All arguments are cast to double + * then rotated. If the type is 'int' then the value is rounded to the + * nearest int + * + * \details Rotation such that when pitch=90 and yaw=0 x1_rot = -x3 and when + * pitch=0 and yaw=90 x1_rot = -x2 + * + * \tparam T The return type + * \param[in] x_1 x1 coordinate + * \param[in] x_2 x2 coordinate + * \param[in] x_3 x3 coordinate + * \param[in] pitch Pitch angle in radians + * \param[in] yaw Yaw angle in radians + * \return std::tuple The new, rotated, coordinates in the + * order . 
Intended to be captured with structured binding + */ + template + inline std::tuple rotateCoords(Real const &x_1, Real const &x_2, + Real const &x_3, Real const &pitch, Real const &yaw) + { + // Compute the sines and cosines. Correct for floating point errors if + // the angle is 0.5*M_PI + Real const sin_yaw = std::sin(yaw); + Real const cos_yaw = (yaw==0.5*M_PI)? 0: std::cos(yaw); + Real const sin_pitch = std::sin(pitch); + Real const cos_pitch = (pitch==0.5*M_PI)? 0: std::cos(pitch); + + // Perform the rotation + Real const x_1_rot = (x_1 * cos_pitch * cos_yaw) + (x_2 * sin_yaw) + (x_3 * sin_pitch * cos_yaw); + Real const x_2_rot = (x_1 * cos_pitch * sin_yaw) + (x_2 * cos_yaw) + (x_3 * sin_pitch * sin_yaw); + Real const x_3_rot = (x_1 * sin_pitch) + (x_3 * cos_pitch); + + if (std::is_same::value) + { + return {round(x_1_rot), + round(x_2_rot), + round(x_3_rot)}; + } + else if (std::is_same::value) + { + return {x_1_rot, x_2_rot, x_3_rot}; + } + } + // ========================================================================= + + // ========================================================================= + /*! + * \brief Compute the dot product of a and b. + * + * \param[in] a1 The first element of a + * \param[in] a2 The second element of a + * \param[in] a3 The third element of a + * \param[in] b1 The first element of b + * \param[in] b2 The second element of b + * \param[in] b3 The third element of b + * + * \return Real The dot product of a and b + */ + inline __device__ __host__ Real dotProduct(Real const &a1, + Real const &a2, + Real const &a3, + Real const &b1, + Real const &b2, + Real const &b3) + {return a1*b1 + ((a2*b2) + (a3*b3));}; + // ========================================================================= + +}//math_utils diff --git a/src/utils/math_utilities_tests.cpp b/src/utils/math_utilities_tests.cpp new file mode 100644 index 000000000..38a2902d6 --- /dev/null +++ b/src/utils/math_utilities_tests.cpp @@ -0,0 +1,64 @@ +/*! 
+ * \file math_utilities_tests.cpp + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Tests for the contents of math_utilities.h + * + */ + +// STL Includes +#include + +// External Includes +#include // Include GoogleTest and related libraries/headers + +// Local Includes +#include "../utils/testing_utilities.h" +#include "../utils/math_utilities.h" +#include "../global/global.h" + +// ============================================================================= +TEST(tALLRotateCoords, + CorrectInputExpectCorrectOutput) +{ + // Fiducial values + double const x_1 = 19.2497333410; + double const x_2 = 60.5197699003; + double const x_3 = 86.0613942621; + double const pitch = 1.239 * M_PI; + double const yaw = 0.171 * M_PI; + double const x_1_rot_fid = -31.565679455456568; + double const x_2_rot_fid = 14.745363873361605; + double const x_3_rot_fid = -76.05402749550727; + + auto [x_1_rot, x_2_rot, x_3_rot] = math_utils::rotateCoords(x_1, x_2, x_3, pitch, yaw); + + testingUtilities::checkResults<0>(x_1_rot_fid, x_1_rot, "x_1 rotated values"); + testingUtilities::checkResults<0>(x_2_rot_fid, x_2_rot, "x_2 rotated values"); + testingUtilities::checkResults<0>(x_3_rot_fid, x_3_rot, "x_3 rotated values"); +} +// ============================================================================= + +// ========================================================================= +/*! 
+ * \brief Test the math_utils::dotProduct function + * + */ +TEST(tALLDotProduct, + CorrectInputExpectCorrectOutput) +{ + std::vector a{21.503067766457753, 48.316634031589935, 81.12177317622657}, + b{38.504606872151484, 18.984145880030045, 89.52561861038686}; + + double const fiducialDotProduct = 9007.6941261535867; + + double testDotProduct; + + testDotProduct = math_utils::dotProduct(a.at(0), a.at(1), a.at(2), + b.at(0), b.at(1), b.at(2)); + + // Now check results + testingUtilities::checkResults(fiducialDotProduct, + testDotProduct, + "dot product"); +} +// ========================================================================= \ No newline at end of file diff --git a/src/utils/mhd_utilities.cpp b/src/utils/mhd_utilities.cpp deleted file mode 100644 index c7747830e..000000000 --- a/src/utils/mhd_utilities.cpp +++ /dev/null @@ -1,18 +0,0 @@ -/*! - * \file mhd_utilities.cpp - * \author Robert 'Bob' Caddy (rvc@pitt.edu) - * \brief Contains the implementation of various utility functions for MHD - * - */ - -// STL Includes - -// External Includes - -// Local Includes -#include "../utils/mhd_utilities.h" - -namespace mhdUtils -{ - -} // end namespace mhdUtils \ No newline at end of file diff --git a/src/utils/mhd_utilities.cu b/src/utils/mhd_utilities.cu new file mode 100644 index 000000000..9e947b6c6 --- /dev/null +++ b/src/utils/mhd_utilities.cu @@ -0,0 +1,25 @@ +/*! + * \file mhd_utilities.cpp + * \author Robert 'Bob' Caddy (rvc@pitt.edu) + * \brief Contains the implementation of various utility functions for MHD and + * for the various kernels, functions, and tools required for the 3D VL+CT MHD + * integrator. 
Due to the CUDA/HIP compiler requiring that device functions be + * directly accessible to the file they're used in most device functions will be + * implemented in the header file + * + */ + +// STL Includes + +// External Includes + +// Local Includes +#include "../utils/mhd_utilities.h" + +namespace mhd{ +namespace utils +{ + +}//utils + +} // end namespace mhd \ No newline at end of file diff --git a/src/utils/mhd_utilities.h b/src/utils/mhd_utilities.h index f28cbb400..d859ab1db 100644 --- a/src/utils/mhd_utilities.h +++ b/src/utils/mhd_utilities.h @@ -15,14 +15,17 @@ #include "../global/global.h" #include "../global/global_cuda.h" #include "../utils/gpu.hpp" +#include "../utils/cuda_utilities.h" -/*! - * \brief Namespace for MHD utilities - * - */ -namespace mhdUtils -{ - namespace // Anonymouse namespace +namespace mhd{ +namespace utils{ + /*! + * \brief Namespace for functions required by functions within the mhd::utils + * namespace. Everything in this name space should be regarded as private + * but is made accesible for testing + * + */ + namespace _internal { // ===================================================================== /*! @@ -59,11 +62,12 @@ namespace mhdUtils return sqrt( (term1 + waveChoice * term2) / (2.0 * fmax(density, TINY_NUMBER)) ); } // ===================================================================== - }// Anonymouse namespace + }// mhd::utils::_internal namespace // ========================================================================= /*! - * \brief Compute the MHD energy in the cell + * \brief Compute the energy in a cell. 
If MHD is not defined then simply + * return the hydro only energy * * \param[in] pressure The gas pressure * \param[in] density The density @@ -87,9 +91,13 @@ namespace mhdUtils Real const &gamma) { // Compute and return energy - return (fmax(pressure,TINY_NUMBER)/(gamma - 1.)) - + 0.5 * density * (velocityX*velocityX + ((velocityY*velocityY) + (velocityZ*velocityZ))) - + 0.5 * (magneticX*magneticX + ((magneticY*magneticY) + (magneticZ*magneticZ))); + Real energy = (fmax(pressure,TINY_NUMBER)/(gamma - 1.)) + + 0.5 * density * (velocityX*velocityX + ((velocityY*velocityY) + (velocityZ*velocityZ))); + #ifdef MHD + energy += 0.5 * (magneticX*magneticX + ((magneticY*magneticY) + (magneticZ*magneticZ))); + #endif //MHD + + return energy; } // ========================================================================= @@ -157,6 +165,23 @@ namespace mhdUtils } // ========================================================================= + // ========================================================================= + /*! + * \brief Compute the magnetic energy + * + * \param[in] magneticX The magnetic field in the X-direction + * \param[in] magneticY The magnetic field in the Y-direction + * \param[in] magneticZ The magnetic field in the Z-direction + * \return Real The magnetic energy + */ + inline __host__ __device__ Real computeMagneticEnergy(Real const &magneticX, + Real const &magneticY, + Real const &magneticZ) + { + return 0.5 * (magneticX*magneticX + ((magneticY*magneticY) + (magneticZ*magneticZ))); + } + // ========================================================================= + // ========================================================================= /*! * \brief Compute the total MHD pressure. I.e. 
magnetic pressure + gas @@ -199,13 +224,13 @@ namespace mhdUtils Real const &gamma) { // Compute the sound speed - return _magnetosonicSpeed(density, - pressure, - magneticX, - magneticY, - magneticZ, - gamma, - 1.0); + return mhd::utils::_internal::_magnetosonicSpeed(density, + pressure, + magneticX, + magneticY, + magneticZ, + gamma, + 1.0); } // ========================================================================= @@ -229,13 +254,13 @@ namespace mhdUtils Real const &gamma) { // Compute the sound speed - return _magnetosonicSpeed(density, - pressure, - magneticX, - magneticY, - magneticZ, - gamma, - -1.0); + return mhd::utils::_internal::_magnetosonicSpeed(density, + pressure, + magneticX, + magneticY, + magneticZ, + gamma, + -1.0); } // ========================================================================= @@ -285,10 +310,20 @@ namespace mhdUtils Real &avgBy, Real &avgBz) { - avgBx = 0.5 * (dev_conserved[(5+NSCALARS)*n_cells + id] + dev_conserved[(5+NSCALARS)*n_cells + ((xid-1) + yid*nx + zid*nx*ny)]); - avgBy = 0.5 * (dev_conserved[(6+NSCALARS)*n_cells + id] + dev_conserved[(6+NSCALARS)*n_cells + (xid + (yid-1)*nx + zid*nx*ny)]); - avgBz = 0.5 * (dev_conserved[(7+NSCALARS)*n_cells + id] + dev_conserved[(7+NSCALARS)*n_cells + (xid + yid*nx + (zid-1)*nx*ny)]); + // Ternary operator to check that no values outside of the magnetic field + // arrays are loaded. If the cell is on the edge that doesn't have magnetic + // fields on both sides then instead set the centered magnetic field to be + // equal to the magnetic field of the closest edge. T + avgBx = (xid > 0) ? + /*if true*/ 0.5 * (dev_conserved[(5+NSCALARS)*n_cells + id] + dev_conserved[(5+NSCALARS)*n_cells + cuda_utilities::compute1DIndex(xid-1, yid, zid, nx, ny)]): + /*if false*/ dev_conserved[(5+NSCALARS)*n_cells + id]; + avgBy = (yid > 0) ? 
+ /*if true*/ 0.5 * (dev_conserved[(6+NSCALARS)*n_cells + id] + dev_conserved[(6+NSCALARS)*n_cells + cuda_utilities::compute1DIndex(xid, yid-1, zid, nx, ny)]): + /*if false*/ dev_conserved[(6+NSCALARS)*n_cells + id]; + avgBz = (zid > 0) ? + /*if true*/ 0.5 * (dev_conserved[(7+NSCALARS)*n_cells + id] + dev_conserved[(7+NSCALARS)*n_cells + cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny)]): + /*if false*/ dev_conserved[(7+NSCALARS)*n_cells + id]; } // ========================================================================= - -} // end namespace mhdUtils \ No newline at end of file +} // end namespace mhd::utils +} // end namespace mhd \ No newline at end of file diff --git a/src/utils/mhd_utilities_tests.cpp b/src/utils/mhd_utilities_tests.cu similarity index 81% rename from src/utils/mhd_utilities_tests.cpp rename to src/utils/mhd_utilities_tests.cu index c5cbb25fb..d56ae2bad 100644 --- a/src/utils/mhd_utilities_tests.cpp +++ b/src/utils/mhd_utilities_tests.cu @@ -11,6 +11,7 @@ #include #include #include +#include // External Includes #include // Include GoogleTest and related libraries/headers @@ -45,12 +46,11 @@ namespace } // ============================================================================= - // ============================================================================= -// Tests for the mhdUtils::computeEnergy function +// Tests for the mhd::utils::computeEnergy function // ============================================================================= /*! 
- * \brief Test the mhdUtils::computeEnergy function with the standard set of + * \brief Test the mhd::utils::computeEnergy function with the standard set of * parameters * */ @@ -64,7 +64,7 @@ TEST(tMHDComputeEnergy, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testEnergy = mhdUtils::computeEnergy(parameters.pressureGas.at(i), + Real testEnergy = mhd::utils::computeEnergy(parameters.pressureGas.at(i), parameters.density.at(i), parameters.velocityX.at(i), parameters.velocityY.at(i), @@ -81,7 +81,7 @@ TEST(tMHDComputeEnergy, } /*! - * \brief Test the mhdUtils::computeEnergy function with a the standard set of + * \brief Test the mhd::utils::computeEnergy function with a the standard set of * parameters except pressure is now negative * */ @@ -95,7 +95,7 @@ TEST(tMHDComputeEnergy, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testEnergy = mhdUtils::computeEnergy(-parameters.pressureGas.at(i), + Real testEnergy = mhd::utils::computeEnergy(-parameters.pressureGas.at(i), parameters.density.at(i), parameters.velocityX.at(i), parameters.velocityY.at(i), @@ -111,14 +111,14 @@ TEST(tMHDComputeEnergy, } } // ============================================================================= -// End of tests for the mhdUtils::computeEnergy function +// End of tests for the mhd::utils::computeEnergy function // ============================================================================= // ============================================================================= -// Tests for the mhdUtils::computeGasPressure function +// Tests for the mhd::utils::computeGasPressure function // ============================================================================= /*! - * \brief Test the mhdUtils::computeGasPressure function with the standard set of + * \brief Test the mhd::utils::computeGasPressure function with the standard set of * parameters. 
Energy has been increased to avoid negative pressures * */ @@ -133,7 +133,7 @@ TEST(tMHDComputeGasPressure, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testGasPressure = mhdUtils::computeGasPressure(energyMultiplier.at(i) * parameters.energy.at(i), + Real testGasPressure = mhd::utils::computeGasPressure(energyMultiplier.at(i) * parameters.energy.at(i), parameters.density.at(i), parameters.momentumX.at(i), parameters.momentumY.at(i), @@ -150,7 +150,7 @@ TEST(tMHDComputeGasPressure, } /*! - * \brief Test the mhdUtils::computeGasPressure function with a the standard set + * \brief Test the mhd::utils::computeGasPressure function with a the standard set * of parameters which produce negative pressures * */ @@ -161,7 +161,7 @@ TEST(tMHDComputeGasPressure, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testGasPressure = mhdUtils::computeGasPressure(parameters.energy.at(i), + Real testGasPressure = mhd::utils::computeGasPressure(parameters.energy.at(i), parameters.density.at(i), parameters.momentumX.at(i), parameters.momentumY.at(i), @@ -178,15 +178,15 @@ TEST(tMHDComputeGasPressure, } } // ============================================================================= -// End of tests for the mhdUtils::computeGasPressure function +// End of tests for the mhd::utils::computeGasPressure function // ============================================================================= // ============================================================================= -// Tests for the mhdUtils::computeThermalEnergy function +// Tests for the mhd::utils::computeThermalEnergy function // ============================================================================= /*! - * \brief Test the mhdUtils::computeThermalEnergy function with the standard set + * \brief Test the mhd::utils::computeThermalEnergy function with the standard set * of parameters. 
* */ @@ -201,7 +201,7 @@ TEST(tMHDComputeThermalEnergy, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testGasPressure = mhdUtils::computeThermalEnergy(energyMultiplier.at(i) * parameters.energy.at(i), + Real testGasPressure = mhd::utils::computeThermalEnergy(energyMultiplier.at(i) * parameters.energy.at(i), parameters.density.at(i), parameters.momentumX.at(i), parameters.momentumY.at(i), @@ -217,14 +217,46 @@ TEST(tMHDComputeThermalEnergy, } } // ============================================================================= -// End of tests for the mhdUtils::computeThermalEnergyfunction +// End of tests for the mhd::utils::computeThermalEnergy function +// ============================================================================= + +// ============================================================================= +// Tests for the mhd::utils::computeMagneticEnergy function +// ============================================================================= +/*! + * \brief Test the mhd::utils::computeMagneticEnergy function with the standard + * set of parameters. 
+ * + */ +TEST(tMHDcomputeMagneticEnergy, + CorrectInputExpectCorrectOutput) +{ + testParams parameters; + std::vector energyMultiplier{1.0E85, 1.0E4, 1.0E105}; + std::vector fiducialEnergy{0.0, + 805356.08013056568, + 6.7079331637514162e+201}; + + for (size_t i = 0; i < parameters.names.size(); i++) + { + Real testMagneticEnergy = mhd::utils::computeMagneticEnergy(parameters.magneticX.at(i), + parameters.magneticY.at(i), + parameters.magneticZ.at(i)); + + testingUtilities::checkResults(fiducialEnergy.at(i), + testMagneticEnergy, + parameters.names.at(i)); + } +} +// ============================================================================= +// End of tests for the mhd::utils::computeMagneticEnergy function // ============================================================================= // ============================================================================= -// Tests for the mhdUtils::computeTotalPressure function +// Tests for the mhd::utils::computeTotalPressure function // ============================================================================= /*! - * \brief Test the mhdUtils::computeTotalPressure function with the standard set + * \brief Test the mhd::utils::computeTotalPressure function with the standard set * of parameters. * */ @@ -238,7 +270,7 @@ TEST(tMHDComputeTotalPressure, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testTotalPressure = mhdUtils::computeTotalPressure(parameters.pressureGas.at(i), + Real testTotalPressure = mhd::utils::computeTotalPressure(parameters.pressureGas.at(i), parameters.magneticX.at(i), parameters.magneticY.at(i), parameters.magneticZ.at(i)); @@ -250,7 +282,7 @@ TEST(tMHDComputeTotalPressure, } /*! - * \brief Test the mhdUtils::computeTotalPressure function with a the standard + * \brief Test the mhd::utils::computeTotalPressure function with a the standard * set of parameters. 
Gas pressure has been multiplied and made negative to * generate negative total pressures * @@ -263,7 +295,7 @@ TEST(tMHDComputeTotalPressure, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testTotalPressure = mhdUtils::computeTotalPressure(pressureMultiplier.at(i) * parameters.pressureGas.at(i), + Real testTotalPressure = mhd::utils::computeTotalPressure(pressureMultiplier.at(i) * parameters.pressureGas.at(i), parameters.magneticX.at(i), parameters.magneticY.at(i), parameters.magneticZ.at(i)); @@ -275,14 +307,14 @@ TEST(tMHDComputeTotalPressure, } } // ============================================================================= -// End of tests for the mhdUtils::computeTotalPressure function +// End of tests for the mhd::utils::computeTotalPressure function // ============================================================================= // ============================================================================= -// Tests for the mhdUtils::fastMagnetosonicSpeed function +// Tests for the mhd::utils::fastMagnetosonicSpeed function // ============================================================================= /*! - * \brief Test the mhdUtils::fastMagnetosonicSpeed function with the standard + * \brief Test the mhd::utils::fastMagnetosonicSpeed function with the standard * set of parameters. All values are reduced by 1e-25 in the large number case * to avoid overflow * @@ -298,7 +330,7 @@ TEST(tMHDFastMagnetosonicSpeed, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testFastMagnetosonicSpeed = mhdUtils::fastMagnetosonicSpeed( + Real testFastMagnetosonicSpeed = mhd::utils::fastMagnetosonicSpeed( coef.at(i)*parameters.density.at(i), coef.at(i)*parameters.pressureGas.at(i), coef.at(i)*parameters.magneticX.at(i), @@ -313,7 +345,7 @@ TEST(tMHDFastMagnetosonicSpeed, } /*! 
- * \brief Test the mhdUtils::fastMagnetosonicSpeed function with the standard + * \brief Test the mhd::utils::fastMagnetosonicSpeed function with the standard * set of parameters, density is negative. All values are reduced by 1e-25 in * the large number case to avoid overflow. * @@ -329,7 +361,7 @@ TEST(tMHDFastMagnetosonicSpeed, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testFastMagnetosonicSpeed = mhdUtils::fastMagnetosonicSpeed( + Real testFastMagnetosonicSpeed = mhd::utils::fastMagnetosonicSpeed( -coef.at(i)*parameters.density.at(i), coef.at(i)*parameters.pressureGas.at(i), coef.at(i)*parameters.magneticX.at(i), @@ -343,14 +375,14 @@ TEST(tMHDFastMagnetosonicSpeed, } } // ============================================================================= -// End of tests for the mhdUtils::fastMagnetosonicSpeed function +// End of tests for the mhd::utils::fastMagnetosonicSpeed function // ============================================================================= // ============================================================================= -// Tests for the mhdUtils::slowMagnetosonicSpeed function +// Tests for the mhd::utils::slowMagnetosonicSpeed function // ============================================================================= /*! - * \brief Test the mhdUtils::slowMagnetosonicSpeed function with the standard + * \brief Test the mhd::utils::slowMagnetosonicSpeed function with the standard * set of parameters. All values are reduced by 1e-25 in the large number case * to avoid overflow * @@ -367,7 +399,7 @@ TEST(tMHDSlowMagnetosonicSpeed, for (size_t i = 2; i < parameters.names.size(); i++) { - Real testSlowMagnetosonicSpeed = mhdUtils::slowMagnetosonicSpeed( + Real testSlowMagnetosonicSpeed = mhd::utils::slowMagnetosonicSpeed( parameters.density.at(i) * coef, parameters.pressureGas.at(i) * coef, parameters.magneticX.at(i) * coef, @@ -382,7 +414,7 @@ TEST(tMHDSlowMagnetosonicSpeed, } /*! 
- * \brief Test the mhdUtils::slowMagnetosonicSpeed function with the standard + * \brief Test the mhd::utils::slowMagnetosonicSpeed function with the standard * set of parameters, density is negative. All values are reduced by 1e-25 in * the large number case to avoid overflow. * @@ -399,7 +431,7 @@ TEST(tMHDSlowMagnetosonicSpeed, for (size_t i = 2; i < parameters.names.size(); i++) { - Real testSlowMagnetosonicSpeed = mhdUtils::slowMagnetosonicSpeed( + Real testSlowMagnetosonicSpeed = mhd::utils::slowMagnetosonicSpeed( -parameters.density.at(i) * coef, parameters.pressureGas.at(i) * coef, parameters.magneticX.at(i) * coef, @@ -413,14 +445,14 @@ TEST(tMHDSlowMagnetosonicSpeed, } } // ============================================================================= -// End of tests for the mhdUtils::slowMagnetosonicSpeed function +// End of tests for the mhd::utils::slowMagnetosonicSpeed function // ============================================================================= // ============================================================================= -// Tests for the mhdUtils::alfvenSpeed function +// Tests for the mhd::utils::alfvenSpeed function // ============================================================================= /*! - * \brief Test the mhdUtils::alfvenSpeed function with the standard set of + * \brief Test the mhd::utils::alfvenSpeed function with the standard set of * parameters. * */ @@ -434,7 +466,7 @@ TEST(tMHDAlfvenSpeed, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testAlfvenSpeed = mhdUtils::alfvenSpeed(parameters.magneticX.at(i), + Real testAlfvenSpeed = mhd::utils::alfvenSpeed(parameters.magneticX.at(i), parameters.density.at(i)); testingUtilities::checkResults(fiducialAlfvenSpeed.at(i), @@ -444,7 +476,7 @@ TEST(tMHDAlfvenSpeed, } /*! 
- * \brief Test the mhdUtils::alfvenSpeed function with the standard set of + * \brief Test the mhd::utils::alfvenSpeed function with the standard set of * parameters except density is negative * */ @@ -458,7 +490,7 @@ TEST(tMHDAlfvenSpeed, for (size_t i = 0; i < parameters.names.size(); i++) { - Real testAlfvenSpeed = mhdUtils::alfvenSpeed(parameters.magneticX.at(i), + Real testAlfvenSpeed = mhd::utils::alfvenSpeed(parameters.magneticX.at(i), -parameters.density.at(i)); testingUtilities::checkResults(fiducialAlfvenSpeed.at(i), @@ -467,11 +499,11 @@ TEST(tMHDAlfvenSpeed, } } // ============================================================================= -// End of tests for the mhdUtils::alfvenSpeed function +// End of tests for the mhd::utils::alfvenSpeed function // ============================================================================= // ============================================================================= -// Tests for the mhdUtils::cellCenteredMagneticFields function +// Tests for the mhd::utils::cellCenteredMagneticFields function // ============================================================================= TEST(tMHDCellCenteredMagneticFields, CorrectInputExpectCorrectOutput) @@ -497,7 +529,7 @@ TEST(tMHDCellCenteredMagneticFields, double testAvgBx, testAvgBy, testAvgBz; // Call the function to test - mhdUtils::cellCenteredMagneticFields(testGrid.data(), id, xid, yid, zid, n_cells, nx, ny, testAvgBx, testAvgBy, testAvgBz); + mhd::utils::cellCenteredMagneticFields(testGrid.data(), id, xid, yid, zid, n_cells, nx, ny, testAvgBx, testAvgBy, testAvgBz); // Check the results testingUtilities::checkResults(fiducialAvgBx, testAvgBx, "cell centered Bx value"); @@ -505,5 +537,5 @@ TEST(tMHDCellCenteredMagneticFields, testingUtilities::checkResults(fiducialAvgBz, testAvgBz, "cell centered Bz value"); } // ============================================================================= -// End of tests for the mhdUtils::cellCenteredMagneticFields function 
+// End of tests for the mhd::utils::cellCenteredMagneticFields function // ============================================================================= diff --git a/src/utils/reduction_utilities.cu b/src/utils/reduction_utilities.cu index 820f27826..65933e42f 100644 --- a/src/utils/reduction_utilities.cu +++ b/src/utils/reduction_utilities.cu @@ -42,19 +42,5 @@ gridReduceMax(maxVal, out); } // ===================================================================== - - // ===================================================================== - void reductionLaunchParams(uint &numBlocks, uint &threadsPerBlock, uint const &deviceNum) - { - cudaDeviceProp prop; - cudaGetDeviceProperties(&prop, deviceNum); - - // Divide the total number of allowed threads by the number of - // threads per block - threadsPerBlock = prop.maxThreadsPerBlock; - numBlocks = (prop.maxThreadsPerMultiProcessor * prop.multiProcessorCount) - / threadsPerBlock; - } - // ===================================================================== }//reduction_utilities #endif //CUDA \ No newline at end of file diff --git a/src/utils/reduction_utilities.h b/src/utils/reduction_utilities.h index 6935d481b..9aef9600d 100644 --- a/src/utils/reduction_utilities.h +++ b/src/utils/reduction_utilities.h @@ -8,7 +8,7 @@ #pragma once // STL Includes -#include +#include // External Includes @@ -78,7 +78,99 @@ } // ===================================================================== + #ifndef O_HIP // ===================================================================== + // This section handles the atomics. It is complicated because CUDA + // doesn't currently support atomics with non-integral types. + // This code is taken from + // https://github.com/rapidsai/cuml/blob/dc14361ba11c41f7a4e1e6a3625bbadd0f52daf7/cpp/src_prims/stats/minmax.cuh + // with slight tweaks for our use case. + // ===================================================================== + /*! 
+ * \brief Do a device side bit cast + * + * \tparam To The output type + * \tparam From The input type + * \param from The input value + * \return To The bit cast version of From as type To + */ + template + __device__ constexpr To bit_cast(const From& from) noexcept + { + // TODO: replace with `std::bitcast` once we adopt C++20 or libcu++ adds it + To to{}; + static_assert(sizeof(To) == sizeof(From)); + memcpy(&to, &from, sizeof(To)); + return to; + } + + /*! + * \brief Encode a float as an int + * + * \param val The float to encode + * \return int The encoded int + */ + inline __device__ int encode(float val) + { + int i = bit_cast(val); + return i >= 0 ? i : (1 << 31) | ~i; + } + + /*! + * \brief Encode a double as a long long int + * + * \param val The double to encode + * \return long long The encoded long long int + */ + inline __device__ long long encode(double val) + { + std::int64_t i = bit_cast(val); + return i >= 0 ? i : (1ULL << 63) | ~i; + } + + /*! + * \brief Decodes an int as a float + * + * \param val The int to decode + * \return float The decoded float + */ + inline __device__ float decode(int val) + { + if (val < 0) val = (1 << 31) | ~val; + return bit_cast(val); + } + + /*! + * \brief Decodes a long long int as a double + * + * \param val The long long to decode + * \return double The decoded double + */ + inline __device__ double decode(long long val) + { + if (val < 0) val = (1ULL << 63) | ~val; + return bit_cast(val); + } + #endif //O_HIP + /*! + * \brief Perform an atomic reduction to find the maximum value of `val` + * + * \param[out] address The pointer to where to store the reduced scalar + * value in device memory + * \param[in] val The thread local variable to find the maximum of across + * the grid. 
Typically this should be a partial reduction that has + * already been reduced to the block level + */ + inline __device__ float atomicMaxBits(float* address, float val) + { + #ifdef O_HIP + return atomicMax(address, val); + #else //O_HIP + int old = atomicMax((int*)address, encode(val)); + return decode(old); + #endif //O_HIP + } + /*! * \brief Perform an atomic reduction to find the maximum value of `val` * @@ -88,27 +180,52 @@ * the grid. Typically this should be a partial reduction that has * already been reduced to the block level */ - __inline__ __device__ double atomicMax_double(double* address, double val) + inline __device__ double atomicMaxBits(double* address, double val) + { + #ifdef O_HIP + return atomicMax(address, val); + #else //O_HIP + long long old = atomicMax((long long*)address, encode(val)); + return decode(old); + #endif //O_HIP + } + + /*! + * \brief Perform an atomic reduction to find the minimum value of `val` + * + * \param[out] address The pointer to where to store the reduced scalar + * value in device memory + * \param[in] val The thread local variable to find the minimum of across + * the grid. Typically this should be a partial reduction that has + * already been reduced to the block level + */ + inline __device__ float atomicMinBits(float* address, float val) { - unsigned long long int* address_as_ull = (unsigned long long int*) address; - unsigned long long int old = *address_as_ull, assumed; - // Explanation of loop here: - // https://stackoverflow.com/questions/16077464/atomicadd-for-double-on-gpu - // The loop is to make sure the value at address doesn't change - // between the load at the atomic since the entire operation isn't - // atomic - - // While it appears that this could result in many times more atomic - // operations than required, in practice it's only a handful of - // extra operation even in the worst case. 
Running with 16,000 - // blocks gives ~8-37 atomics after brief testing - do { - assumed = old; - old = atomicCAS(address_as_ull, - assumed, - __double_as_longlong(fmax(__longlong_as_double(assumed),val))); - } while (assumed != old); - return __longlong_as_double(old); + #ifdef O_HIP + return atomicMin(address, val); + #else //O_HIP + int old = atomicMin((int*)address, encode(val)); + return decode(old); + #endif //O_HIP + } + + /*! + * \brief Perform an atomic reduction to find the minimum value of `val` + * + * \param[out] address The pointer to where to store the reduced scalar + * value in device memory + * \param[in] val The thread local variable to find the minimum of across + * the grid. Typically this should be a partial reduction that has + * already been reduced to the block level + */ + inline __device__ double atomicMinBits(double* address, double val) + { + #ifdef O_HIP + return atomicMin(address, val); + #else //O_HIP + long long old = atomicMin((long long*)address, encode(val)); + return decode(old); + #endif //O_HIP } // ===================================================================== @@ -119,6 +236,10 @@ * before the kernel launch that uses this function to avoid any * potential race condition; the `cuda_utilities::setScalarDeviceMemory` * function exists for this purpose. + * of `val`. Note that the value of `out` should be set appropriately + * before the kernel launch that uses this function to avoid any + * potential race condition; the `cuda_utilities::setScalarDeviceMemory` + * function exists for this purpose. * * \details This function can perform a reduction to find the maximum of * the thread local variable `val` across the entire grid. It relies on a @@ -128,7 +249,7 @@ * by using as many threads per block as possible and as few blocks as * possible since each block has to perform an atomic operation. 
To * accomplish this it is reccommened that you use the - * `reductionLaunchParams` functions to get the optimal number of blocks + * `AutomaticLaunchParams` functions to get the optimal number of blocks * and threads per block to launch rather than relying on Cholla defaults * and then within the kernel using a grid-stride loop to make sure the * kernel works with any combination of threads and blocks. Note that @@ -147,17 +268,23 @@ __inline__ __device__ void gridReduceMax(Real val, Real* out) { // __syncthreads(); // Wait for all threads to calculate val; + // __syncthreads(); // Wait for all threads to calculate val; // Reduce the entire block in parallel val = blockReduceMax(val); // Write block level reduced value to the output scalar atomically - if (threadIdx.x == 0) atomicMax_double(out, val); + if (threadIdx.x == 0) atomicMaxBits(out, val); } // ===================================================================== // ===================================================================== /*! + * \brief Find the maximum value in the array. Make sure to initialize + * `out` correctly before using this kernel; the + * `cuda_utilities::setScalarDeviceMemory` function exists for this + * purpose. If `in` and `out` are the same array that's ok, all the + * loads are completed before the overwrite occurs. * \brief Find the maximum value in the array. Make sure to initialize * `out` correctly before using this kernel; the * `cuda_utilities::setScalarDeviceMemory` function exists for this @@ -171,23 +298,5 @@ */ __global__ void kernelReduceMax(Real *in, Real* out, size_t N); // ===================================================================== - - // ===================================================================== - /*! 
- * \brief Determine the optimal number of blocks and threads per block to - * use when launching a reduction kernel - * - * \param[out] numBlocks The maximum number of blocks that are - * scheduleable by the device in use when each block has the maximum - * number of threads - * \param[out] threadsPerBlock The maximum threads per block supported by - * the device in use - * \param[in] deviceNum optional: which device is being targeted. - * Defaults to zero - */ - void reductionLaunchParams(uint &numBlocks, - uint &threadsPerBlock, - uint const &deviceNum=0); - // ===================================================================== } // namespace reduction_utilities #endif //CUDA diff --git a/src/utils/reduction_utilities_tests.cu b/src/utils/reduction_utilities_tests.cu index 2314b33be..64613cc5b 100644 --- a/src/utils/reduction_utilities_tests.cu +++ b/src/utils/reduction_utilities_tests.cu @@ -17,6 +17,8 @@ // Local Includes #include "../utils/testing_utilities.h" #include "../utils/reduction_utilities.h" +#include "../utils/cuda_utilities.h" +#include "../utils/DeviceVector.h" #include "../global/global.h" @@ -28,8 +30,7 @@ TEST(tALLKernelReduceMax, CorrectInputExpectCorrectOutput) { // Launch parameters // ================= - uint numBlocks, threadsPerBlock; - reduction_utilities::reductionLaunchParams(numBlocks, threadsPerBlock); + cuda_utilities::AutomaticLaunchParams static const launchParams(reduction_utilities::kernelReduceMax); // Grid Parameters & testing parameters // ==================================== @@ -37,7 +38,6 @@ TEST(tALLKernelReduceMax, CorrectInputExpectCorrectOutput) size_t const size = std::pow(gridSize, 3);; Real const maxValue = 4; std::vector host_grid(size); - Real host_max = -DBL_MAX; // Fill grid with random values and assign maximum value std::mt19937 prng(1); @@ -52,44 +52,22 @@ TEST(tALLKernelReduceMax, CorrectInputExpectCorrectOutput) // Allocating and copying to device // ================================ - Real *dev_grid; - 
CudaSafeCall(cudaMalloc(&dev_grid, host_grid.size() * sizeof(Real))); - CudaSafeCall(cudaMemcpy(dev_grid, host_grid.data(), host_grid.size() * sizeof(Real), cudaMemcpyHostToDevice)); + cuda_utilities::DeviceVector dev_grid(host_grid.size()); + dev_grid.cpyHostToDevice(host_grid); - Real *dev_max_array; - CudaSafeCall(cudaMalloc(&dev_max_array, numBlocks*sizeof(Real))); - // Sets all bytes to 0. - cudaMemset(dev_max_array,0,numBlocks*sizeof(Real)); - - Real host_max_array[numBlocks]; - //Real *host_max_array = (Real *) malloc(numBlocks*sizeof(Real)); - //CudaSafeCall( cudaHostAlloc(&host_max_array, numBlocks*sizeof(Real), cudaHostAllocDefault) ); + cuda_utilities::DeviceVector static dev_max(1); + dev_max.assign(std::numeric_limits::lowest()); // Do the reduction // ================ - hipLaunchKernelGGL(reduction_utilities::kernelReduceMax, numBlocks, threadsPerBlock, 0, 0, dev_grid, dev_max_array, host_grid.size()); + hipLaunchKernelGGL(reduction_utilities::kernelReduceMax, + launchParams.numBlocks, launchParams.threadsPerBlock, 0, 0, + dev_grid.data(), dev_max.data(), host_grid.size()); CudaCheckError(); - - // Copy back and sync - // ================== - CudaSafeCall(cudaMemcpy(&host_max_array, dev_max_array, numBlocks*sizeof(Real), cudaMemcpyDeviceToHost)); - cudaDeviceSynchronize(); - - for (int i = 0; i < numBlocks; i++) - { - host_max = fmax(host_max,host_max_array[i]); - } - - //free(host_max_array); - - cudaFree(dev_max_array); - - cudaFree(dev_grid); - // Perform comparison - testingUtilities::checkResults(maxValue, host_max, "maximum value found"); + testingUtilities::checkResults(maxValue, dev_max.at(0), "maximum value found"); } // ============================================================================= // Tests for divergence max reduction diff --git a/src/utils/testing_utilities.cpp b/src/utils/testing_utilities.cpp index 9b8bee948..6035b68b5 100644 --- a/src/utils/testing_utilities.cpp +++ b/src/utils/testing_utilities.cpp @@ -80,52 +80,6 @@ 
namespace testingUtilities } // ========================================================================= - // ========================================================================= - void checkResults(double fiducialNumber, - double testNumber, - std::string outString, - double fixedEpsilon, - int ulpsEpsilon) - { - // Check for equality and if not equal return difference - double absoluteDiff; - int64_t ulpsDiff; - bool areEqual; - - if ((fixedEpsilon < 0) and (ulpsEpsilon < 0)) - { - areEqual = testingUtilities::nearlyEqualDbl(fiducialNumber, - testNumber, - absoluteDiff, - ulpsDiff); - } - else if ((fixedEpsilon > 0) and (ulpsEpsilon < 0)) - { - areEqual = testingUtilities::nearlyEqualDbl(fiducialNumber, - testNumber, - absoluteDiff, - ulpsDiff, - fixedEpsilon); - } - else - { - areEqual = testingUtilities::nearlyEqualDbl(fiducialNumber, - testNumber, - absoluteDiff, - ulpsDiff, - fixedEpsilon, - ulpsEpsilon); - } - - EXPECT_TRUE(areEqual) - << "Difference in " << outString << std::endl - << "The fiducial value is: " << fiducialNumber << std::endl - << "The test value is: " << testNumber << std::endl - << "The absolute difference is: " << absoluteDiff << std::endl - << "The ULP difference is: " << ulpsDiff << std::endl; - } - // ========================================================================= - void wrapperEqual(int i, int j, int k, std::string dataSetName, double test_value, double fid_value, double fixedEpsilon=5.0E-12) { @@ -139,24 +93,24 @@ namespace testingUtilities outString += k; outString += "]"; - checkResults(fid_value,test_value,outString,fixedEpsilon); + ASSERT_NO_FATAL_FAILURE(checkResults<1>(fid_value,test_value,outString,fixedEpsilon)); } void analyticConstant(systemTest::SystemTestRunner testObject, std::string dataSetName, double value) { std::vector testDims(3,1); std::vector testData = testObject.loadTestFieldData(dataSetName,testDims); for (size_t i = 0; i < testDims[0]; i++) + { + for (size_t j = 0; j < testDims[1]; j++) { - for 
(size_t j = 0; j < testDims[1]; j++) - { - for (size_t k = 0; k < testDims[2]; k++) - { - size_t index = (i * testDims[1] * testDims[2]) + (j * testDims[2]) + k; - - wrapperEqual(i,j,k,dataSetName,testData.at(index),value); - } - } + for (size_t k = 0; k < testDims[2]; k++) + { + size_t index = (i * testDims[1] * testDims[2]) + (j * testDims[2]) + k; + + ASSERT_NO_FATAL_FAILURE(wrapperEqual(i,j,k,dataSetName,testData.at(index),value)); + } } + } } void analyticSine(systemTest::SystemTestRunner testObject, std::string dataSetName, @@ -166,17 +120,17 @@ namespace testingUtilities std::vector testDims(3,1); std::vector testData = testObject.loadTestFieldData(dataSetName,testDims); for (size_t i = 0; i < testDims[0]; i++) - { - for (size_t j = 0; j < testDims[1]; j++) - { - for (size_t k = 0; k < testDims[2]; k++) - { - double value = constant + amplitude*std::sin(kx*i+ky*j+kz*k+phase); - size_t index = (i * testDims[1] * testDims[2]) + (j * testDims[2]) + k; - wrapperEqual(i,j,k,dataSetName,testData.at(index),value,tolerance); - } - } - } + { + for (size_t j = 0; j < testDims[1]; j++) + { + for (size_t k = 0; k < testDims[2]; k++) + { + double value = constant + amplitude*std::sin(kx*i+ky*j+kz*k+phase); + size_t index = (i * testDims[1] * testDims[2]) + (j * testDims[2]) + k; + ASSERT_NO_FATAL_FAILURE(wrapperEqual(i,j,k,dataSetName,testData.at(index),value,tolerance)); + } + } + } } diff --git a/src/utils/testing_utilities.h b/src/utils/testing_utilities.h index 927a61f28..b98780247 100644 --- a/src/utils/testing_utilities.h +++ b/src/utils/testing_utilities.h @@ -10,6 +10,10 @@ // STL includes #include +#include +#include +#include + #include "../system_tests/system_tester.h" // provide systemTest class // ============================================================================= @@ -106,6 +110,8 @@ namespace testingUtilities * \brief A simple function to compare two doubles with the nearlyEqualDbl * function, perform a GTest assert on the result, and print out 
the values * + * \tparam checkType The type of GTest assertion to use. "0" for and + * "EXPECT" and "1" for an "ASSERT" * \param[in] fiducialNumber The fiducial number to test against * \param[in] testNumber The unverified number to test * \param[in] outString A string to be printed in the first line of the output @@ -115,11 +121,66 @@ namespace testingUtilities * \param[in] ulpsEpsilon The ULP epsilon to use in the comparison. Negative * values are ignored and default behaviour is used */ + template void checkResults(double fiducialNumber, double testNumber, std::string outString, double fixedEpsilon = -999, - int ulpsEpsilon = -999); + int ulpsEpsilon = -999) + { + // Check for equality and if not equal return difference + double absoluteDiff; + int64_t ulpsDiff; + bool areEqual; + + if ((fixedEpsilon < 0) and (ulpsEpsilon < 0)) + { + areEqual = testingUtilities::nearlyEqualDbl(fiducialNumber, + testNumber, + absoluteDiff, + ulpsDiff); + } + else if ((fixedEpsilon > 0) and (ulpsEpsilon < 0)) + { + areEqual = testingUtilities::nearlyEqualDbl(fiducialNumber, + testNumber, + absoluteDiff, + ulpsDiff, + fixedEpsilon); + } + else + { + areEqual = testingUtilities::nearlyEqualDbl(fiducialNumber, + testNumber, + absoluteDiff, + ulpsDiff, + fixedEpsilon, + ulpsEpsilon); + } + + std::stringstream outputMessage; + outputMessage << std::setprecision(std::numeric_limits::max_digits10) + << "Difference in " << outString << std::endl + << "The fiducial value is: " << fiducialNumber << std::endl + << "The test value is: " << testNumber << std::endl + << "The absolute difference is: " << absoluteDiff << std::endl + << "The ULP difference is: " << ulpsDiff << std::endl; + + if (checkType == 0) + { + EXPECT_TRUE(areEqual) << outputMessage.str(); + } + else if (checkType == 1) + { + ASSERT_TRUE(areEqual) << outputMessage.str(); + } + else + { + throw std::runtime_error("Incorrect template argument passed to " + "checkResults. 
Options are 0 and 1 but " + + std::to_string(checkType) + " was passed"); + } + } // ========================================================================= // ========================================================================= From 0c0952942f539d3b6a56a810cf353f5dbd690bd9 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Tue, 20 Dec 2022 16:08:14 -0500 Subject: [PATCH 02/18] Replace MHD indexing with grid_enums --- src/grid/grid3D.cpp | 12 ++++----- src/grid/grid_enum.h | 28 +++++++++++++++++--- src/hydro/hydro_cuda.cu | 12 ++++----- src/integrators/VL_3D_cuda.cu | 27 ++++++++++--------- src/mhd/ct_electric_fields.cu | 36 +++++++++++++------------- src/mhd/ct_electric_fields.h | 10 +++---- src/mhd/ct_electric_fields_tests.cu | 6 ++--- src/mhd/magnetic_divergence.cu | 12 ++++----- src/mhd/magnetic_update.cu | 6 ++--- src/reconstruction/pcm_cuda.cu | 24 ++++++++--------- src/riemann_solvers/hlld_cuda.cu | 13 +++++----- src/riemann_solvers/hlld_cuda_tests.cu | 32 +++++++++++------------ src/utils/mhd_utilities.h | 12 ++++----- 13 files changed, 126 insertions(+), 104 deletions(-) diff --git a/src/grid/grid3D.cpp b/src/grid/grid3D.cpp index cadcb3653..bd67e87e6 100644 --- a/src/grid/grid3D.cpp +++ b/src/grid/grid3D.cpp @@ -299,9 +299,9 @@ void Grid3D::AllocateMemory(void) #endif #endif //SCALAR #ifdef MHD - C.magnetic_x = &(C.host[(5 + NSCALARS)*H.n_cells]); - C.magnetic_y = &(C.host[(6 + NSCALARS)*H.n_cells]); - C.magnetic_z = &(C.host[(7 + NSCALARS)*H.n_cells]); + C.magnetic_x = &(C.host[(grid_enum::magnetic_x)*H.n_cells]); + C.magnetic_y = &(C.host[(grid_enum::magnetic_y)*H.n_cells]); + C.magnetic_z = &(C.host[(grid_enum::magnetic_z)*H.n_cells]); #endif //MHD #ifdef DE C.GasEnergy = &(C.host[(H.n_fields-1)*H.n_cells]); @@ -322,9 +322,9 @@ void Grid3D::AllocateMemory(void) #endif #endif // SCALAR #ifdef MHD - C.d_magnetic_x = &(C.device[(5 + NSCALARS)*H.n_cells]); - C.d_magnetic_y = &(C.device[(6 + NSCALARS)*H.n_cells]); - C.d_magnetic_z = &(C.device[(7 + 
NSCALARS)*H.n_cells]); + C.d_magnetic_x = &(C.device[(grid_enum::magnetic_x)*H.n_cells]); + C.d_magnetic_y = &(C.device[(grid_enum::magnetic_y)*H.n_cells]); + C.d_magnetic_z = &(C.device[(grid_enum::magnetic_z)*H.n_cells]); #endif //MHD #ifdef DE C.d_GasEnergy = &(C.device[(H.n_fields-1)*H.n_cells]); diff --git a/src/grid/grid_enum.h b/src/grid/grid_enum.h index 6f25676dd..315533f5d 100644 --- a/src/grid/grid_enum.h +++ b/src/grid/grid_enum.h @@ -2,8 +2,8 @@ // An enum which holds offsets for grid quantities // In the final form of this approach, this file will also set nfields (not yet) and NSCALARS (done) -// so that adding a field only requires registering it here: -// grid knows to allocate memory based on nfields and NSCALARS +// so that adding a field only requires registering it here: +// grid knows to allocate memory based on nfields and NSCALARS // and values can be accessed with density[id + ncells*grid_enum::enum_name] // example: C.device[id + H.n_cells*grid_enum::basic_scalar] @@ -55,7 +55,7 @@ enum : int { #endif // SCALAR finalscalar_plus_1, // needed to calculate NSCALARS - finalscalar = finalscalar_plus_1 - 1, // resets enum to finalscalar so fields afterwards are correct + finalscalar = finalscalar_plus_1 - 1, // resets enum to finalscalar so fields afterwards are correct // so that anything after starts with scalar + NSCALARS #ifdef MHD @@ -69,7 +69,29 @@ enum : int { num_fields, //Aliases and manually computed enums + #ifdef MHD + num_flux_fields = num_fields-1, + num_interface_fields = num_fields-1, + #else + num_flux_fields = num_fields, + num_interface_fields = num_fields, + #endif //MHD nscalars = finalscalar_plus_1 - scalar, + magnetic_start = magnetic_x, + magnetic_end = magnetic_z, + // Note that the direction of the flux, the suffix _? 
indicates the direction of the electric field, not the magnetic flux + fluxX_magnetic_z = magnetic_start, + fluxX_magnetic_y = magnetic_start+1, + fluxY_magnetic_x = magnetic_start, + fluxY_magnetic_z = magnetic_start+1, + fluxZ_magnetic_y = magnetic_start, + fluxZ_magnetic_x = magnetic_start+1, + Q_x_magnetic_y = magnetic_start, + Q_x_magnetic_z = magnetic_start+1, + Q_y_magnetic_z = magnetic_start, + Q_y_magnetic_x = magnetic_start+1, + Q_z_magnetic_x = magnetic_start, + Q_z_magnetic_y = magnetic_start+1 }; } diff --git a/src/hydro/hydro_cuda.cu b/src/hydro/hydro_cuda.cu index c9fa2b682..add8af96a 100644 --- a/src/hydro/hydro_cuda.cu +++ b/src/hydro/hydro_cuda.cu @@ -1193,12 +1193,12 @@ __device__ void Average_Cell_All_Fields( int i, int j, int k, int nx, int ny, in Average_Cell_Single_Field( 4, i, j, k, nx, ny, nz, ncells, conserved ); #ifdef MHD // Average MHD - Average_Cell_Single_Field( 5+NSCALARS, i, j, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( 6+NSCALARS, i, j, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( 7+NSCALARS, i, j, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( 5+NSCALARS, i-1, j, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( 6+NSCALARS, i, j-1, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( 7+NSCALARS, i, j, k-1, nx, ny, nz, ncells, conserved ); + Average_Cell_Single_Field( grid_enum::magnetic_x, i, j, k, nx, ny, nz, ncells, conserved ); + Average_Cell_Single_Field( grid_enum::magnetic_y, i, j, k, nx, ny, nz, ncells, conserved ); + Average_Cell_Single_Field( grid_enum::magnetic_z, i, j, k, nx, ny, nz, ncells, conserved ); + Average_Cell_Single_Field( grid_enum::magnetic_x, i-1, j, k, nx, ny, nz, ncells, conserved ); + Average_Cell_Single_Field( grid_enum::magnetic_y, i, j-1, k, nx, ny, nz, ncells, conserved ); + Average_Cell_Single_Field( grid_enum::magnetic_z, i, j, k-1, nx, ny, nz, ncells, conserved ); #endif //MHD #ifdef DE // Average GasEnergy diff 
--git a/src/integrators/VL_3D_cuda.cu b/src/integrators/VL_3D_cuda.cu index 2d23cc636..1f9a6a459 100644 --- a/src/integrators/VL_3D_cuda.cu +++ b/src/integrators/VL_3D_cuda.cu @@ -67,8 +67,7 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real *d_grav_potential, int nx, int // `Q_Lx` interface store the reconstructed Y and Z magnetic fields in // that order, the `Q_Ly` interface stores the Z and X mangetic fields in // that order, and the `Q_Lz` interface stores the X and Y magnetic fields - // in that order. These fields start at the (5+NSCALARS)*n_cells and - // (6+NSCALARS)*n_cells locations respectively. The interface state arrays + // in that order. These fields can be indexed with the Q_?_dir grid_enums. The interface state arrays // store in the interface on the "right" side of the cell, so the flux // arrays store the fluxes through the right interface // @@ -77,12 +76,12 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real *d_grav_potential, int nx, int // -cross(V,B)x is the negative of the x-component of V cross B. Note that // "X" is the direction the solver is running in this case, not // necessarily the true "X". 
- // F_x[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Z - // F_x[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Y - // F_y[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_X - // F_y[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Z - // F_z[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Y - // F_z[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_X + // F_x[(grid_enum::fluxX_magnetic_z)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Z + // F_x[(grid_enum::fluxX_magnetic_y)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Y + // F_y[(grid_enum::fluxY_magnetic_x)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_X + // F_y[(grid_enum::fluxY_magnetic_z)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Z + // F_z[(grid_enum::fluxZ_magnetic_y)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Y + // F_z[(grid_enum::fluxZ_magnetic_x)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_X size_t const arraySize = (n_fields-1) * n_cells * sizeof(Real); size_t const ctArraySize = 3 * n_cells * sizeof(Real); #else // not MHD @@ -157,9 +156,9 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real *d_grav_potential, int nx, int hipLaunchKernelGGL(Calculate_HLL_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); #endif //HLL #ifdef HLLD - hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lx, Q_Rx, &(dev_conserved[(5 + NSCALARS) * n_cells]), F_x, nx, ny, nz, n_ghost, gama, 0, n_fields); - hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Ly, Q_Ry, &(dev_conserved[(6 + NSCALARS) * n_cells]), F_y, nx, ny, nz, n_ghost, gama, 1, n_fields); - hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, &(dev_conserved[(7 + NSCALARS) * n_cells]), F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lx, Q_Rx, 
&(dev_conserved[(grid_enum::magnetic_x) * n_cells]), F_x, nx, ny, nz, n_ghost, gama, 0, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Ly, Q_Ry, &(dev_conserved[(grid_enum::magnetic_y) * n_cells]), F_y, nx, ny, nz, n_ghost, gama, 1, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, &(dev_conserved[(grid_enum::magnetic_z) * n_cells]), F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); #endif //HLLD CudaCheckError(); @@ -227,9 +226,9 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real *d_grav_potential, int nx, int hipLaunchKernelGGL(Calculate_HLL_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); #endif //HLLC #ifdef HLLD - hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lx, Q_Rx, &(dev_conserved_half[(5 + NSCALARS) * n_cells]), F_x, nx, ny, nz, n_ghost, gama, 0, n_fields); - hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Ly, Q_Ry, &(dev_conserved_half[(6 + NSCALARS) * n_cells]), F_y, nx, ny, nz, n_ghost, gama, 1, n_fields); - hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, &(dev_conserved_half[(7 + NSCALARS) * n_cells]), F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lx, Q_Rx, &(dev_conserved_half[(grid_enum::magnetic_x) * n_cells]), F_x, nx, ny, nz, n_ghost, gama, 0, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Ly, Q_Ry, &(dev_conserved_half[(grid_enum::magnetic_y) * n_cells]), F_y, nx, ny, nz, n_ghost, gama, 1, n_fields); + hipLaunchKernelGGL(mhd::Calculate_HLLD_Fluxes_CUDA, dim1dGrid, dim1dBlock, 0, 0, Q_Lz, Q_Rz, &(dev_conserved_half[(grid_enum::magnetic_z) * n_cells]), F_z, nx, ny, nz, n_ghost, gama, 2, n_fields); #endif //HLLD CudaCheckError(); diff --git 
a/src/mhd/ct_electric_fields.cu b/src/mhd/ct_electric_fields.cu index 64a17bf52..310da1be2 100644 --- a/src/mhd/ct_electric_fields.cu +++ b/src/mhd/ct_electric_fields.cu @@ -44,12 +44,12 @@ namespace mhd // fields/EMF. -cross(V,B)x is the negative of the x-component of V // cross B. Note that "X" is the direction the solver is running in // this case, not necessarily the true "X". - // F_x[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Z - // F_x[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Y - // F_y[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_X - // F_y[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Z - // F_z[(5+NSCALARS)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Y - // F_z[(6+NSCALARS)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_X + // F_x[(grid_enum::fluxX_magnetic_z)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Z + // F_x[(grid_enum::fluxX_magnetic_y)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Y + // F_y[(grid_enum::fluxY_magnetic_x)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_X + // F_y[(grid_enum::fluxY_magnetic_z)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Z + // F_z[(grid_enum::fluxZ_magnetic_y)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Y + // F_z[(grid_enum::fluxZ_magnetic_x)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_X // Notes on Implementation Details // - The density flux has the same sign as the velocity on the face @@ -147,10 +147,10 @@ namespace mhd // Load the face centered electric fields Note the negative signs to // convert from magnetic flux to electric field - face_y_pos = + fluxZ[cuda_utilities::compute1DIndex(xid , yid , zid-1, nx, ny) + (6+NSCALARS)*n_cells]; - face_y_neg = + fluxZ[cuda_utilities::compute1DIndex(xid , yid-1, zid-1, nx, ny) + (6+NSCALARS)*n_cells]; - face_z_pos = - fluxY[cuda_utilities::compute1DIndex(xid , yid-1, zid , nx, ny) + (5+NSCALARS)*n_cells]; - face_z_neg = - fluxY[cuda_utilities::compute1DIndex(xid , yid-1, zid-1, nx, ny) + 
(5+NSCALARS)*n_cells]; + face_y_pos = + fluxZ[cuda_utilities::compute1DIndex(xid , yid , zid-1, nx, ny) + (grid_enum::fluxZ_magnetic_x)*n_cells]; + face_y_neg = + fluxZ[cuda_utilities::compute1DIndex(xid , yid-1, zid-1, nx, ny) + (grid_enum::fluxZ_magnetic_x)*n_cells]; + face_z_pos = - fluxY[cuda_utilities::compute1DIndex(xid , yid-1, zid , nx, ny) + (grid_enum::fluxY_magnetic_x)*n_cells]; + face_z_neg = - fluxY[cuda_utilities::compute1DIndex(xid , yid-1, zid-1, nx, ny) + (grid_enum::fluxY_magnetic_x)*n_cells]; // sum and average face centered electric fields and slopes to get the // edge averaged electric field. @@ -233,10 +233,10 @@ namespace mhd // Load the face centered electric fields Note the negative signs to // convert from magnetic flux to electric field - face_x_pos = - fluxZ[cuda_utilities::compute1DIndex(xid , yid, zid-1, nx, ny) + (5+NSCALARS)*n_cells]; - face_x_neg = - fluxZ[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny) + (5+NSCALARS)*n_cells]; - face_z_pos = + fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid , nx, ny) + (6+NSCALARS)*n_cells]; - face_z_neg = + fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny) + (6+NSCALARS)*n_cells]; + face_x_pos = - fluxZ[cuda_utilities::compute1DIndex(xid , yid, zid-1, nx, ny) + (grid_enum::fluxZ_magnetic_y)*n_cells]; + face_x_neg = - fluxZ[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny) + (grid_enum::fluxZ_magnetic_y)*n_cells]; + face_z_pos = + fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid , nx, ny) + (grid_enum::fluxX_magnetic_y)*n_cells]; + face_z_neg = + fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny) + (grid_enum::fluxX_magnetic_y)*n_cells]; // sum and average face centered electric fields and slopes to get the // edge averaged electric field. 
@@ -319,10 +319,10 @@ namespace mhd // Load the face centered electric fields Note the negative signs to // convert from magnetic flux to electric field - face_x_pos = + fluxY[cuda_utilities::compute1DIndex(xid , yid-1, zid, nx, ny) + (6+NSCALARS)*n_cells]; - face_x_neg = + fluxY[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny) + (6+NSCALARS)*n_cells]; - face_y_pos = - fluxX[cuda_utilities::compute1DIndex(xid-1, yid , zid, nx, ny) + (5+NSCALARS)*n_cells]; - face_y_neg = - fluxX[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny) + (5+NSCALARS)*n_cells]; + face_x_pos = + fluxY[cuda_utilities::compute1DIndex(xid , yid-1, zid, nx, ny) + (grid_enum::fluxY_magnetic_z)*n_cells]; + face_x_neg = + fluxY[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny) + (grid_enum::fluxY_magnetic_z)*n_cells]; + face_y_pos = - fluxX[cuda_utilities::compute1DIndex(xid-1, yid , zid, nx, ny) + (grid_enum::fluxX_magnetic_z)*n_cells]; + face_y_neg = - fluxX[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny) + (grid_enum::fluxX_magnetic_z)*n_cells]; // sum and average face centered electric fields and slopes to get the // edge averaged electric field. 
diff --git a/src/mhd/ct_electric_fields.h b/src/mhd/ct_electric_fields.h index 987633461..9e122d0dd 100644 --- a/src/mhd/ct_electric_fields.h +++ b/src/mhd/ct_electric_fields.h @@ -107,10 +107,10 @@ namespace mhd Real const density = dev_conserved[idxCentered ]; Real const Momentum2 = dev_conserved[idxCentered + (modPlus1+1) *n_cells]; Real const Momentum3 = dev_conserved[idxCentered + (modPlus2+1) *n_cells]; - Real const B2Centered = 0.5 * ( dev_conserved[idxCentered + (modPlus1+5+NSCALARS)*n_cells] - + dev_conserved[idxB2Shift + (modPlus1+5+NSCALARS)*n_cells]); - Real const B3Centered = 0.5 * ( dev_conserved[idxCentered + (modPlus2+5+NSCALARS)*n_cells] - + dev_conserved[idxB3Shift + (modPlus2+5+NSCALARS)*n_cells]); + Real const B2Centered = 0.5 * ( dev_conserved[idxCentered + (modPlus1+grid_enum::magnetic_start)*n_cells] + + dev_conserved[idxB2Shift + (modPlus1+grid_enum::magnetic_start)*n_cells]); + Real const B3Centered = 0.5 * ( dev_conserved[idxCentered + (modPlus2+grid_enum::magnetic_start)*n_cells] + + dev_conserved[idxB3Shift + (modPlus2+grid_enum::magnetic_start)*n_cells]); // Compute the electric field in the center with a cross product Real const electric_centered = (Momentum3*B2Centered - Momentum2*B3Centered) / density; @@ -118,7 +118,7 @@ namespace mhd // Load face centered electric field, note fluxSign to correctly do // the shift from magnetic flux to EMF/electric field and to choose // which field to use - Real const electric_face = fluxSign * flux[idxFlux + (int(fluxSign == 1)+5+NSCALARS)*n_cells]; + Real const electric_face = fluxSign * flux[idxFlux + (int(fluxSign == 1)+grid_enum::magnetic_start)*n_cells]; // Compute the slope and return it return electric_face - electric_centered; diff --git a/src/mhd/ct_electric_fields_tests.cu b/src/mhd/ct_electric_fields_tests.cu index 55b46f3c8..becbe2afa 100644 --- a/src/mhd/ct_electric_fields_tests.cu +++ b/src/mhd/ct_electric_fields_tests.cu @@ -44,9 +44,9 @@ public: ny(nx), nz(nx), n_cells(nx*ny*nz), - 
fluxX(n_cells * (7+NSCALARS)), - fluxY(n_cells * (7+NSCALARS)), - fluxZ(n_cells * (7+NSCALARS)), + fluxX(n_cells * (grid_enum::num_flux_fields)), + fluxY(n_cells * (grid_enum::num_flux_fields)), + fluxZ(n_cells * (grid_enum::num_flux_fields)), grid (n_cells * (8+NSCALARS)), testCTElectricFields(n_cells * 3, -999.), fiducialData(n_cells * 3, -999.), diff --git a/src/mhd/magnetic_divergence.cu b/src/mhd/magnetic_divergence.cu index 02051e48c..0d8bf90a1 100644 --- a/src/mhd/magnetic_divergence.cu +++ b/src/mhd/magnetic_divergence.cu @@ -59,14 +59,14 @@ namespace mhd // Compute divergence cellDivergence = - (( dev_conserved[id + (5+NSCALARS)*n_cells] - - dev_conserved[id_xMin1 + (5+NSCALARS)*n_cells]) + (( dev_conserved[id + (grid_enum::magnetic_x)*n_cells] + - dev_conserved[id_xMin1 + (grid_enum::magnetic_x)*n_cells]) / dx) - + (( dev_conserved[id + (6+NSCALARS)*n_cells] - - dev_conserved[id_yMin1 + (6+NSCALARS)*n_cells]) + + (( dev_conserved[id + (grid_enum::magnetic_y)*n_cells] + - dev_conserved[id_yMin1 + (grid_enum::magnetic_y)*n_cells]) / dy) - + (( dev_conserved[id + (7+NSCALARS)*n_cells] - - dev_conserved[id_zMin1 + (7+NSCALARS)*n_cells]) + + (( dev_conserved[id + (grid_enum::magnetic_z)*n_cells] + - dev_conserved[id_zMin1 + (grid_enum::magnetic_z)*n_cells]) / dz); maxDivergence = max(maxDivergence, fabs(cellDivergence)); diff --git a/src/mhd/magnetic_update.cu b/src/mhd/magnetic_update.cu index 78f298e05..fb6a89fec 100644 --- a/src/mhd/magnetic_update.cu +++ b/src/mhd/magnetic_update.cu @@ -61,17 +61,17 @@ namespace mhd // Perform Updates // X field update - destinationGrid[threadId + (5+NSCALARS)*n_cells] = sourceGrid[threadId + (5+NSCALARS)*n_cells] + destinationGrid[threadId + (grid_enum::magnetic_x)*n_cells] = sourceGrid[threadId + (grid_enum::magnetic_x)*n_cells] + dtodz * (electric_y_3 - electric_y_1) + dtody * (electric_z_1 - electric_z_3); // Y field update - destinationGrid[threadId + (6+NSCALARS)*n_cells] = sourceGrid[threadId + (6+NSCALARS)*n_cells] 
+ destinationGrid[threadId + (grid_enum::magnetic_y)*n_cells] = sourceGrid[threadId + (grid_enum::magnetic_y)*n_cells] + dtodx * (electric_z_3 - electric_z_2) + dtodz * (electric_x_1 - electric_x_3); // Z field update - destinationGrid[threadId + (7+NSCALARS)*n_cells] = sourceGrid[threadId + (7+NSCALARS)*n_cells] + destinationGrid[threadId + (grid_enum::magnetic_z)*n_cells] = sourceGrid[threadId + (grid_enum::magnetic_z)*n_cells] + dtody * (electric_x_3 - electric_x_2) + dtodx * (electric_y_2 - electric_y_3); } diff --git a/src/reconstruction/pcm_cuda.cu b/src/reconstruction/pcm_cuda.cu index 91fb75223..4998dcd92 100644 --- a/src/reconstruction/pcm_cuda.cu +++ b/src/reconstruction/pcm_cuda.cu @@ -325,8 +325,8 @@ __global__ void PCM_Reconstruction_3D(Real *dev_conserved, } #endif //SCALAR #ifdef MHD - dev_bounds_Lx[(5+NSCALARS)*n_cells + id] = cellCenteredBy; - dev_bounds_Lx[(6+NSCALARS)*n_cells + id] = cellCenteredBz; + dev_bounds_Lx[(grid_enum::Q_x_magnetic_y)*n_cells + id] = cellCenteredBy; + dev_bounds_Lx[(grid_enum::Q_x_magnetic_z)*n_cells + id] = cellCenteredBz; #endif //MHD #ifdef DE dev_bounds_Lx[(n_fields-1)*n_cells + id] = ge; @@ -345,8 +345,8 @@ __global__ void PCM_Reconstruction_3D(Real *dev_conserved, } #endif //SCALAR #ifdef MHD - dev_bounds_Ly[(5+NSCALARS)*n_cells + id] = cellCenteredBz; - dev_bounds_Ly[(6+NSCALARS)*n_cells + id] = cellCenteredBx; + dev_bounds_Ly[(grid_enum::Q_y_magnetic_z)*n_cells + id] = cellCenteredBz; + dev_bounds_Ly[(grid_enum::Q_y_magnetic_x)*n_cells + id] = cellCenteredBx; #endif //MHD #ifdef DE dev_bounds_Ly[(n_fields-1)*n_cells + id] = ge; @@ -365,8 +365,8 @@ __global__ void PCM_Reconstruction_3D(Real *dev_conserved, } #endif //SCALAR #ifdef MHD - dev_bounds_Lz[(5+NSCALARS)*n_cells + id] = cellCenteredBx; - dev_bounds_Lz[(6+NSCALARS)*n_cells + id] = cellCenteredBy; + dev_bounds_Lz[(grid_enum::Q_z_magnetic_x)*n_cells + id] = cellCenteredBx; + dev_bounds_Lz[(grid_enum::Q_z_magnetic_y)*n_cells + id] = cellCenteredBy; #endif 
//MHD #ifdef DE dev_bounds_Lz[(n_fields-1)*n_cells + id] = ge; @@ -388,8 +388,8 @@ __global__ void PCM_Reconstruction_3D(Real *dev_conserved, } #endif //SCALAR #ifdef MHD - dev_bounds_Rx[(5+NSCALARS)*n_cells + id] = cellCenteredBy; - dev_bounds_Rx[(6+NSCALARS)*n_cells + id] = cellCenteredBz; + dev_bounds_Rx[(grid_enum::Q_x_magnetic_y)*n_cells + id] = cellCenteredBy; + dev_bounds_Rx[(grid_enum::Q_x_magnetic_z)*n_cells + id] = cellCenteredBz; #endif //MHD #ifdef DE dev_bounds_Rx[(n_fields-1)*n_cells + id] = ge; @@ -412,8 +412,8 @@ __global__ void PCM_Reconstruction_3D(Real *dev_conserved, } #endif //SCALAR #ifdef MHD - dev_bounds_Ry[(5+NSCALARS)*n_cells + id] = cellCenteredBz; - dev_bounds_Ry[(6+NSCALARS)*n_cells + id] = cellCenteredBx; + dev_bounds_Ry[(grid_enum::Q_y_magnetic_z)*n_cells + id] = cellCenteredBz; + dev_bounds_Ry[(grid_enum::Q_y_magnetic_x)*n_cells + id] = cellCenteredBx; #endif //MHD #ifdef DE dev_bounds_Ry[(n_fields-1)*n_cells + id] = ge; @@ -436,8 +436,8 @@ __global__ void PCM_Reconstruction_3D(Real *dev_conserved, } #endif //SCALAR #ifdef MHD - dev_bounds_Rz[(5+NSCALARS)*n_cells + id] = cellCenteredBx; - dev_bounds_Rz[(6+NSCALARS)*n_cells + id] = cellCenteredBy; + dev_bounds_Rz[(grid_enum::Q_z_magnetic_x)*n_cells + id] = cellCenteredBx; + dev_bounds_Rz[(grid_enum::Q_z_magnetic_y)*n_cells + id] = cellCenteredBy; #endif //MHD #ifdef DE dev_bounds_Rz[(n_fields-1)*n_cells + id] = ge; diff --git a/src/riemann_solvers/hlld_cuda.cu b/src/riemann_solvers/hlld_cuda.cu index ca20fdb1f..18fe8578e 100644 --- a/src/riemann_solvers/hlld_cuda.cu +++ b/src/riemann_solvers/hlld_cuda.cu @@ -16,6 +16,7 @@ #include "../riemann_solvers/hlld_cuda.h" #include "../utils/cuda_utilities.h" #include "../utils/math_utilities.h" +#include "../grid/grid_enum.h" #ifdef DE //PRESSURE_DE #include "../utils/hydro_utilities.h" @@ -73,8 +74,8 @@ namespace mhd Real momentumYL = dev_bounds_L[threadId + n_cells * o2]; Real momentumZL = dev_bounds_L[threadId + n_cells * o3]; Real energyL 
= dev_bounds_L[threadId + n_cells * 4]; - Real magneticYL = dev_bounds_L[threadId + n_cells * (5 + NSCALARS)]; - Real magneticZL = dev_bounds_L[threadId + n_cells * (6 + NSCALARS)]; + Real magneticYL = dev_bounds_L[threadId + n_cells * (grid_enum::Q_x_magnetic_y)]; + Real magneticZL = dev_bounds_L[threadId + n_cells * (grid_enum::Q_x_magnetic_z)]; #ifdef SCALAR Real scalarConservedL[NSCALARS]; @@ -93,8 +94,8 @@ namespace mhd Real momentumYR = dev_bounds_R[threadId + n_cells * o2]; Real momentumZR = dev_bounds_R[threadId + n_cells * o3]; Real energyR = dev_bounds_R[threadId + n_cells * 4]; - Real magneticYR = dev_bounds_R[threadId + n_cells * (5 + NSCALARS)]; - Real magneticZR = dev_bounds_R[threadId + n_cells * (6 + NSCALARS)]; + Real magneticYR = dev_bounds_R[threadId + n_cells * (grid_enum::Q_x_magnetic_y)]; + Real magneticZR = dev_bounds_R[threadId + n_cells * (grid_enum::Q_x_magnetic_z)]; #ifdef SCALAR Real scalarConservedR[NSCALARS]; @@ -706,8 +707,8 @@ namespace mhd dev_flux[threadId + n_cells * o2] = momentumFluxY; dev_flux[threadId + n_cells * o3] = momentumFluxZ; dev_flux[threadId + n_cells * 4] = energyFlux; - dev_flux[threadId + n_cells * (5 + NSCALARS)] = magneticFluxY; - dev_flux[threadId + n_cells * (6 + NSCALARS)] = magneticFluxZ; + dev_flux[threadId + n_cells * (grid_enum::fluxX_magnetic_z)] = magneticFluxY; + dev_flux[threadId + n_cells * (grid_enum::fluxX_magnetic_y)] = magneticFluxZ; } // ===================================================================== diff --git a/src/riemann_solvers/hlld_cuda_tests.cu b/src/riemann_solvers/hlld_cuda_tests.cu index c39116d7a..ad4ac1547 100644 --- a/src/riemann_solvers/hlld_cuda_tests.cu +++ b/src/riemann_solvers/hlld_cuda_tests.cu @@ -16,6 +16,7 @@ // Local Includes #include "../global/global_cuda.h" +#include "../grid/grid_enum.h" #include "../utils/gpu.hpp" #include "../utils/testing_utilities.h" #include "../utils/mhd_utilities.h" @@ -65,12 +66,11 @@ // Create new vectors that store the values in the way 
that the HLLD // solver expects - size_t const magXIndex = 5+NSCALARS; - EXPECT_DOUBLE_EQ(stateLeft.at(magXIndex), stateRight.at(magXIndex)) + EXPECT_DOUBLE_EQ(stateLeft.at(grid_enum::magnetic_x), stateRight.at(grid_enum::magnetic_x)) << "The left and right magnetic fields are not equal"; - std::vector const magneticX{stateLeft.at(magXIndex)}; - stateLeft.erase(stateLeft.begin() + magXIndex); - stateRight.erase(stateRight.begin() + magXIndex); + std::vector const magneticX{stateLeft.at(grid_enum::magnetic_x)}; + stateLeft.erase(stateLeft.begin() + grid_enum::magnetic_x); + stateRight.erase(stateRight.begin() + grid_enum::magnetic_x); // Simulation Paramters int const nx = 1; // Number of cells in the x-direction @@ -153,7 +153,7 @@ // The HLLD solver only writes the the first two "slots" for // magnetic flux so let's rearrange to make sure we have all the // magnetic fluxes in the right spots - testFlux.insert(testFlux.begin() + magXIndex, 0.0); + testFlux.insert(testFlux.begin() + grid_enum::magnetic_x, 0.0); std::rotate(testFlux.begin() + 1, testFlux.begin() + 1 + direction, testFlux.begin() + 4); // Rotate momentum return testFlux; @@ -294,9 +294,9 @@ output.at(1), output.at(2), output.at(3), - output.at(5 + NSCALARS), - output.at(6 + NSCALARS), - output.at(7 + NSCALARS), + output.at(grid_enum::magnetic_x), + output.at(grid_enum::magnetic_y), + output.at(grid_enum::magnetic_z), gamma)); #endif //DE return output; @@ -1665,11 +1665,11 @@ negativeDensityPressure.insert(negativeDensityPressure.begin()+5, conservedScalar.begin(), conservedScalar.begin() + NSCALARS); #endif // SCALAR #ifdef DE - negativePressure.push_back(mhd::utils::computeThermalEnergy(negativePressure.at(4),negativePressure.at(0),negativePressure.at(1),negativePressure.at(2),negativePressure.at(3),negativePressure.at(5 + NSCALARS),negativePressure.at(6 + NSCALARS),negativePressure.at(7 + NSCALARS),gamma)); - 
negativeEnergy.push_back(mhd::utils::computeThermalEnergy(negativeEnergy.at(4),negativeEnergy.at(0),negativeEnergy.at(1),negativeEnergy.at(2),negativeEnergy.at(3),negativeEnergy.at(5 + NSCALARS),negativeEnergy.at(6 + NSCALARS),negativeEnergy.at(7 + NSCALARS),gamma)); - negativeDensity.push_back(mhd::utils::computeThermalEnergy(negativeDensity.at(4),negativeDensity.at(0),negativeDensity.at(1),negativeDensity.at(2),negativeDensity.at(3),negativeDensity.at(5 + NSCALARS),negativeDensity.at(6 + NSCALARS),negativeDensity.at(7 + NSCALARS),gamma)); - negativeDensityEnergyPressure.push_back(mhd::utils::computeThermalEnergy(negativeDensityEnergyPressure.at(4),negativeDensityEnergyPressure.at(0),negativeDensityEnergyPressure.at(1),negativeDensityEnergyPressure.at(2),negativeDensityEnergyPressure.at(3),negativeDensityEnergyPressure.at(5 + NSCALARS),negativeDensityEnergyPressure.at(6 + NSCALARS),negativeDensityEnergyPressure.at(7 + NSCALARS),gamma)); - negativeDensityPressure.push_back(mhd::utils::computeThermalEnergy(negativeDensityPressure.at(4),negativeDensityPressure.at(0),negativeDensityPressure.at(1),negativeDensityPressure.at(2),negativeDensityPressure.at(3),negativeDensityPressure.at(5 + NSCALARS),negativeDensityPressure.at(6 + NSCALARS),negativeDensityPressure.at(7 + NSCALARS),gamma)); + negativePressure.push_back(mhd::utils::computeThermalEnergy(negativePressure.at(4),negativePressure.at(0),negativePressure.at(1),negativePressure.at(2),negativePressure.at(3),negativePressure.at(grid_enum::magnetic_x),negativePressure.at(grid_enum::magnetic_y),negativePressure.at(grid_enum::magnetic_z),gamma)); + negativeEnergy.push_back(mhd::utils::computeThermalEnergy(negativeEnergy.at(4),negativeEnergy.at(0),negativeEnergy.at(1),negativeEnergy.at(2),negativeEnergy.at(3),negativeEnergy.at(grid_enum::magnetic_x),negativeEnergy.at(grid_enum::magnetic_y),negativeEnergy.at(grid_enum::magnetic_z),gamma)); + 
negativeDensity.push_back(mhd::utils::computeThermalEnergy(negativeDensity.at(4),negativeDensity.at(0),negativeDensity.at(1),negativeDensity.at(2),negativeDensity.at(3),negativeDensity.at(grid_enum::magnetic_x),negativeDensity.at(grid_enum::magnetic_y),negativeDensity.at(grid_enum::magnetic_z),gamma)); + negativeDensityEnergyPressure.push_back(mhd::utils::computeThermalEnergy(negativeDensityEnergyPressure.at(4),negativeDensityEnergyPressure.at(0),negativeDensityEnergyPressure.at(1),negativeDensityEnergyPressure.at(2),negativeDensityEnergyPressure.at(3),negativeDensityEnergyPressure.at(grid_enum::magnetic_x),negativeDensityEnergyPressure.at(grid_enum::magnetic_y),negativeDensityEnergyPressure.at(grid_enum::magnetic_z),gamma)); + negativeDensityPressure.push_back(mhd::utils::computeThermalEnergy(negativeDensityPressure.at(4),negativeDensityPressure.at(0),negativeDensityPressure.at(1),negativeDensityPressure.at(2),negativeDensityPressure.at(3),negativeDensityPressure.at(grid_enum::magnetic_x),negativeDensityPressure.at(grid_enum::magnetic_y),negativeDensityPressure.at(grid_enum::magnetic_z),gamma)); #endif //DE for (size_t direction = 0; direction < 3; direction++) @@ -2532,8 +2532,8 @@ int const fiducialMomentumIndexY = threadId + n_cells * o2; int const fiducialMomentumIndexZ = threadId + n_cells * o3; int const fiducialEnergyIndex = threadId + n_cells * 4; - int const fiducialMagneticYIndex = threadId + n_cells * (5 + NSCALARS); - int const fiducialMagneticZIndex = threadId + n_cells * (6 + NSCALARS); + int const fiducialMagneticYIndex = threadId + n_cells * (grid_enum::magnetic_x); + int const fiducialMagneticZIndex = threadId + n_cells * (grid_enum::magnetic_y); mhd::_internal::_returnFluxes(threadId, o1, diff --git a/src/utils/mhd_utilities.h b/src/utils/mhd_utilities.h index d859ab1db..abe1c80e9 100644 --- a/src/utils/mhd_utilities.h +++ b/src/utils/mhd_utilities.h @@ -315,14 +315,14 @@ namespace utils{ // fields on both sides then instead set the centered 
magnetic field to be // equal to the magnetic field of the closest edge. T avgBx = (xid > 0) ? - /*if true*/ 0.5 * (dev_conserved[(5+NSCALARS)*n_cells + id] + dev_conserved[(5+NSCALARS)*n_cells + cuda_utilities::compute1DIndex(xid-1, yid, zid, nx, ny)]): - /*if false*/ dev_conserved[(5+NSCALARS)*n_cells + id]; + /*if true*/ 0.5 * (dev_conserved[(grid_enum::magnetic_x)*n_cells + id] + dev_conserved[(grid_enum::magnetic_x)*n_cells + cuda_utilities::compute1DIndex(xid-1, yid, zid, nx, ny)]): + /*if false*/ dev_conserved[(grid_enum::magnetic_x)*n_cells + id]; avgBy = (yid > 0) ? - /*if true*/ 0.5 * (dev_conserved[(6+NSCALARS)*n_cells + id] + dev_conserved[(6+NSCALARS)*n_cells + cuda_utilities::compute1DIndex(xid, yid-1, zid, nx, ny)]): - /*if false*/ dev_conserved[(6+NSCALARS)*n_cells + id]; + /*if true*/ 0.5 * (dev_conserved[(grid_enum::magnetic_y)*n_cells + id] + dev_conserved[(grid_enum::magnetic_y)*n_cells + cuda_utilities::compute1DIndex(xid, yid-1, zid, nx, ny)]): + /*if false*/ dev_conserved[(grid_enum::magnetic_y)*n_cells + id]; avgBz = (zid > 0) ? 
- /*if true*/ 0.5 * (dev_conserved[(7+NSCALARS)*n_cells + id] + dev_conserved[(7+NSCALARS)*n_cells + cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny)]): - /*if false*/ dev_conserved[(7+NSCALARS)*n_cells + id]; + /*if true*/ 0.5 * (dev_conserved[(grid_enum::magnetic_z)*n_cells + id] + dev_conserved[(grid_enum::magnetic_z)*n_cells + cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny)]): + /*if false*/ dev_conserved[(grid_enum::magnetic_z)*n_cells + id]; } // ========================================================================= } // end namespace mhd::utils From 3121feaf3c0cd82c2af518fb5dd9a3661b8376fd Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Tue, 20 Dec 2022 17:21:11 -0500 Subject: [PATCH 03/18] Remove duplicate lines in the makefile --- Makefile | 3 --- 1 file changed, 3 deletions(-) diff --git a/Makefile b/Makefile index dcc6d296c..f03a7478d 100644 --- a/Makefile +++ b/Makefile @@ -38,9 +38,6 @@ ifeq ($(TEST), true) CFLAGS += $(TEST_FLAGS) CXXFLAGS += $(TEST_FLAGS) GPUFLAGS += $(TEST_FLAGS) - CFLAGS += $(TEST_FLAGS) - CXXFLAGS += $(TEST_FLAGS) - GPUFLAGS += $(TEST_FLAGS) # HACK # Set the build flags to debug. 
This is mostly to avoid the approximations From 27011bf49e9a2c4d001a91474ceb25f429afdcaf Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Tue, 20 Dec 2022 17:23:03 -0500 Subject: [PATCH 04/18] Remove HIP error limit when compiling --- Makefile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Makefile b/Makefile index f03a7478d..9d302d693 100644 --- a/Makefile +++ b/Makefile @@ -134,7 +134,7 @@ ifdef HIPCONFIG DFLAGS += -DO_HIP CXXFLAGS += $(HIPCONFIG) GPUCXX ?= hipcc - GPUFLAGS += -Wall -ferror-limit=1 + GPUFLAGS += -Wall LD := $(CXX) LDFLAGS := $(CXXFLAGS) -L$(ROCM_PATH)/lib LIBS += -lamdhip64 From 49aaef5904612f6896df08ad2449237d738ea09d Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Tue, 20 Dec 2022 17:45:00 -0500 Subject: [PATCH 05/18] Fix MHD usage of grid_enums so other builds will compile --- src/grid/grid_enum.h | 10 ++++++++-- src/mhd/ct_electric_fields.cu | 5 +++-- src/mhd/ct_electric_fields.h | 8 +++----- src/mhd/ct_electric_fields_tests.cu | 2 ++ src/mhd/magnetic_divergence.cu | 5 +++-- src/mhd/magnetic_divergence_tests.cu | 2 ++ src/mhd/magnetic_update.cu | 5 +++-- src/mhd/magnetic_update_tests.cu | 2 ++ src/riemann_solvers/hlld_cuda.cu | 10 ++++------ src/riemann_solvers/hlld_cuda_tests.cu | 4 +++- src/utils/mhd_utilities.h | 2 ++ src/utils/mhd_utilities_tests.cu | 2 ++ 12 files changed, 37 insertions(+), 20 deletions(-) diff --git a/src/grid/grid_enum.h b/src/grid/grid_enum.h index 315533f5d..b96f0f4ca 100644 --- a/src/grid/grid_enum.h +++ b/src/grid/grid_enum.h @@ -68,7 +68,9 @@ enum : int { #endif num_fields, -//Aliases and manually computed enums + //Aliases and manually computed enums + nscalars = finalscalar_plus_1 - scalar, + #ifdef MHD num_flux_fields = num_fields-1, num_interface_fields = num_fields-1, @@ -76,9 +78,11 @@ enum : int { num_flux_fields = num_fields, num_interface_fields = num_fields, #endif //MHD - nscalars = finalscalar_plus_1 - scalar, + + #ifdef MHD magnetic_start = magnetic_x, magnetic_end = magnetic_z, + // 
Note that the direction of the flux, the suffix _? indicates the direction of the electric field, not the magnetic flux fluxX_magnetic_z = magnetic_start, fluxX_magnetic_y = magnetic_start+1, @@ -86,12 +90,14 @@ enum : int { fluxY_magnetic_z = magnetic_start+1, fluxZ_magnetic_y = magnetic_start, fluxZ_magnetic_x = magnetic_start+1, + Q_x_magnetic_y = magnetic_start, Q_x_magnetic_z = magnetic_start+1, Q_y_magnetic_z = magnetic_start, Q_y_magnetic_x = magnetic_start+1, Q_z_magnetic_x = magnetic_start, Q_z_magnetic_y = magnetic_start+1 + #endif // MHD }; } diff --git a/src/mhd/ct_electric_fields.cu b/src/mhd/ct_electric_fields.cu index 310da1be2..cd90ae2ac 100644 --- a/src/mhd/ct_electric_fields.cu +++ b/src/mhd/ct_electric_fields.cu @@ -11,7 +11,7 @@ // Local Includes #include "../mhd/ct_electric_fields.h" - +#ifdef MHD namespace mhd { // ========================================================================= @@ -337,4 +337,5 @@ namespace mhd } } // ========================================================================= -} // end namespace mhd \ No newline at end of file +} // end namespace mhd +#endif // MHD diff --git a/src/mhd/ct_electric_fields.h b/src/mhd/ct_electric_fields.h index 9e122d0dd..3db5927ad 100644 --- a/src/mhd/ct_electric_fields.h +++ b/src/mhd/ct_electric_fields.h @@ -17,10 +17,7 @@ #include "../utils/gpu.hpp" #include "../utils/cuda_utilities.h" -/*! - * \brief Namespace for MHD code - * - */ +#ifdef MHD namespace mhd { /*! 
@@ -152,4 +149,5 @@ namespace mhd int const nz, int const n_cells); // ========================================================================= -} // end namespace mhd \ No newline at end of file +} // end namespace mhd +#endif // MHD \ No newline at end of file diff --git a/src/mhd/ct_electric_fields_tests.cu b/src/mhd/ct_electric_fields_tests.cu index becbe2afa..5ba3a999a 100644 --- a/src/mhd/ct_electric_fields_tests.cu +++ b/src/mhd/ct_electric_fields_tests.cu @@ -20,6 +20,7 @@ #include "../mhd/ct_electric_fields.h" #include "../global/global.h" +#ifdef MHD // ============================================================================= // Tests for the mhd::Calculate_CT_Electric_Fields kernel // ============================================================================= @@ -205,3 +206,4 @@ TEST_F(tMHDCalculateCTElectricFields, runTest(); } // ============================================================================= +#endif // MHD diff --git a/src/mhd/magnetic_divergence.cu b/src/mhd/magnetic_divergence.cu index 0d8bf90a1..50aec4f1b 100644 --- a/src/mhd/magnetic_divergence.cu +++ b/src/mhd/magnetic_divergence.cu @@ -20,7 +20,7 @@ #include "../utils/cuda_utilities.h" #include "../utils/reduction_utilities.h" #include "../utils/DeviceVector.h" - +#ifdef MHD namespace mhd { // ========================================================================= @@ -109,4 +109,5 @@ namespace mhd return dev_maxDivergence[0]; } // ========================================================================= -} // end namespace mhd \ No newline at end of file +} // end namespace mhd +#endif // MHD diff --git a/src/mhd/magnetic_divergence_tests.cu b/src/mhd/magnetic_divergence_tests.cu index ba2695e53..9751f6e0b 100644 --- a/src/mhd/magnetic_divergence_tests.cu +++ b/src/mhd/magnetic_divergence_tests.cu @@ -21,6 +21,7 @@ #include "../utils/DeviceVector.h" #include "../global/global.h" +#ifdef MHD // ============================================================================= // 
Tests for the magnetic field divergence functions // ============================================================================= @@ -57,3 +58,4 @@ TEST(tMHDLaunchCalculateMagneticDivergence, CorrectInputExpectCorrectOutput) // ============================================================================= // End of tests for the magnetic field divergence functions // ============================================================================= +#endif // MHD diff --git a/src/mhd/magnetic_update.cu b/src/mhd/magnetic_update.cu index fb6a89fec..550fb7188 100644 --- a/src/mhd/magnetic_update.cu +++ b/src/mhd/magnetic_update.cu @@ -12,7 +12,7 @@ // Local Includes #include "../mhd/magnetic_update.h" #include "../utils/cuda_utilities.h" - +#ifdef MHD namespace mhd { // ========================================================================= @@ -77,4 +77,5 @@ namespace mhd } } // ========================================================================= -} // end namespace mhd \ No newline at end of file +} // end namespace mhd +#endif // MHD diff --git a/src/mhd/magnetic_update_tests.cu b/src/mhd/magnetic_update_tests.cu index 7cb4f68f2..bebef2621 100644 --- a/src/mhd/magnetic_update_tests.cu +++ b/src/mhd/magnetic_update_tests.cu @@ -19,6 +19,7 @@ #include "../utils/cuda_utilities.h" #include "../mhd/magnetic_update.h" +#ifdef MHD // ============================================================================= /*! * \brief Test fixture for tMHDUpdateMagneticField3D test suite @@ -148,3 +149,4 @@ TEST_F(tMHDUpdateMagneticField3D, runTest(); } // ============================================================================= +#endif // MHD diff --git a/src/riemann_solvers/hlld_cuda.cu b/src/riemann_solvers/hlld_cuda.cu index 18fe8578e..a7793150b 100644 --- a/src/riemann_solvers/hlld_cuda.cu +++ b/src/riemann_solvers/hlld_cuda.cu @@ -23,10 +23,8 @@ #endif // DE #ifdef CUDA -/*! 
- * \brief Namespace for MHD code - * - */ + +#ifdef MHD namespace mhd { // ========================================================================= @@ -912,5 +910,5 @@ namespace mhd } // mhd::_internal namespace } // end namespace mhd - -#endif // CUDA \ No newline at end of file +#endif // MHD +#endif // CUDA diff --git a/src/riemann_solvers/hlld_cuda_tests.cu b/src/riemann_solvers/hlld_cuda_tests.cu index ad4ac1547..a6ec74358 100644 --- a/src/riemann_solvers/hlld_cuda_tests.cu +++ b/src/riemann_solvers/hlld_cuda_tests.cu @@ -23,6 +23,7 @@ #include "../riemann_solvers/hlld_cuda.h" // Include code to test #ifdef CUDA +#ifdef MHD // ========================================================================= // Integration tests for the entire HLLD solver. Unit tests are below // ========================================================================= @@ -2578,4 +2579,5 @@ } } // ========================================================================= -#endif // CUDA \ No newline at end of file +#endif // MHD +#endif // CUDA diff --git a/src/utils/mhd_utilities.h b/src/utils/mhd_utilities.h index abe1c80e9..6b587e535 100644 --- a/src/utils/mhd_utilities.h +++ b/src/utils/mhd_utilities.h @@ -282,6 +282,7 @@ namespace utils{ // ========================================================================= // ========================================================================= + #ifdef MHD /*! 
* \brief Compute the cell centered average of the magnetic fields in a * given cell @@ -324,6 +325,7 @@ namespace utils{ /*if true*/ 0.5 * (dev_conserved[(grid_enum::magnetic_z)*n_cells + id] + dev_conserved[(grid_enum::magnetic_z)*n_cells + cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny)]): /*if false*/ dev_conserved[(grid_enum::magnetic_z)*n_cells + id]; } + #endif // MHD // ========================================================================= } // end namespace mhd::utils } // end namespace mhd \ No newline at end of file diff --git a/src/utils/mhd_utilities_tests.cu b/src/utils/mhd_utilities_tests.cu index d56ae2bad..dcbbebca8 100644 --- a/src/utils/mhd_utilities_tests.cu +++ b/src/utils/mhd_utilities_tests.cu @@ -505,6 +505,7 @@ TEST(tMHDAlfvenSpeed, // ============================================================================= // Tests for the mhd::utils::cellCenteredMagneticFields function // ============================================================================= +#ifdef MHD TEST(tMHDCellCenteredMagneticFields, CorrectInputExpectCorrectOutput) { @@ -536,6 +537,7 @@ TEST(tMHDCellCenteredMagneticFields, testingUtilities::checkResults(fiducialAvgBy, testAvgBy, "cell centered By value"); testingUtilities::checkResults(fiducialAvgBz, testAvgBz, "cell centered Bz value"); } +#endif // MHD // ============================================================================= // End of tests for the mhd::utils::cellCenteredMagneticFields function // ============================================================================= From 095b619ac4e909fbb937e4e8fa96cb3e2936a749 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Tue, 20 Dec 2022 17:58:32 -0500 Subject: [PATCH 06/18] Finish replacing NSCALARS in MHD test code Note: The scalar loops in PCM and the HLLD solver haven't been touched --- src/mhd/ct_electric_fields_tests.cu | 2 +- src/mhd/magnetic_update_tests.cu | 6 +++--- src/riemann_solvers/hlld_cuda_tests.cu | 22 +++++++++++----------- 
src/utils/mhd_utilities_tests.cu | 2 +- 4 files changed, 16 insertions(+), 16 deletions(-) diff --git a/src/mhd/ct_electric_fields_tests.cu b/src/mhd/ct_electric_fields_tests.cu index 5ba3a999a..b526ab7e0 100644 --- a/src/mhd/ct_electric_fields_tests.cu +++ b/src/mhd/ct_electric_fields_tests.cu @@ -48,7 +48,7 @@ public: fluxX(n_cells * (grid_enum::num_flux_fields)), fluxY(n_cells * (grid_enum::num_flux_fields)), fluxZ(n_cells * (grid_enum::num_flux_fields)), - grid (n_cells * (8+NSCALARS)), + grid (n_cells * (grid_enum::num_fields)), testCTElectricFields(n_cells * 3, -999.), fiducialData(n_cells * 3, -999.), dimGrid((n_cells + TPB - 1),1,1), diff --git a/src/mhd/magnetic_update_tests.cu b/src/mhd/magnetic_update_tests.cu index bebef2621..501803e1c 100644 --- a/src/mhd/magnetic_update_tests.cu +++ b/src/mhd/magnetic_update_tests.cu @@ -44,10 +44,10 @@ public: dx(2.5), dy(2.5), dz(2.5), - sourceGrid (n_cells * (8+NSCALARS)), - destinationGrid (n_cells * (8+NSCALARS), -999.), + sourceGrid (n_cells * (grid_enum::num_fields)), + destinationGrid (n_cells * (grid_enum::num_fields), -999.), ctElectricFields(n_cells * 3), - fiducialData (n_cells * (8+NSCALARS), -999.), + fiducialData (n_cells * (grid_enum::num_fields), -999.), dimGrid((n_cells + TPB - 1),1,1), dimBlock(TPB,1,1) { diff --git a/src/riemann_solvers/hlld_cuda_tests.cu b/src/riemann_solvers/hlld_cuda_tests.cu index a6ec74358..0de90e6f9 100644 --- a/src/riemann_solvers/hlld_cuda_tests.cu +++ b/src/riemann_solvers/hlld_cuda_tests.cu @@ -204,13 +204,13 @@ #endif //DE #ifdef SCALAR std::vector scalarNames{"Scalar 1", "Scalar 2", "Scalar 3"}; - fieldNames.insert(fieldNames.begin()+5, + fieldNames.insert(fieldNames.begin() + grid_enum::magnetic_start, scalarNames.begin(), - scalarNames.begin() + NSCALARS); + scalarNames.begin() + grid_enum::nscalars); - fiducialFlux.insert(fiducialFlux.begin()+5, + fiducialFlux.insert(fiducialFlux.begin() + grid_enum::magnetic_start, scalarFlux.begin(), - scalarFlux.begin() + 
NSCALARS); + scalarFlux.begin() + grid_enum::nscalars); #endif //SCALAR ASSERT_TRUE( (fiducialFlux.size() == testFlux.size()) @@ -285,9 +285,9 @@ primitiveScalars.end(), conservedScalar.begin(), [&](Real const &c){ return c*output.at(0); }); - output.insert(output.begin()+5, + output.insert(output.begin() + grid_enum::magnetic_start, conservedScalar.begin(), - conservedScalar.begin() + NSCALARS); + conservedScalar.begin() + grid_enum::nscalars); #endif //SCALAR #ifdef DE output.push_back(mhd::utils::computeThermalEnergy(output.at(4), @@ -1659,11 +1659,11 @@ #ifdef SCALAR std::vector const conservedScalar{1.1069975296, 2.2286185018, 3.3155141875}; - negativePressure.insert(negativePressure.begin()+5, conservedScalar.begin(), conservedScalar.begin() + NSCALARS); - negativeEnergy.insert(negativeEnergy.begin()+5, conservedScalar.begin(), conservedScalar.begin() + NSCALARS); - negativeDensity.insert(negativeDensity.begin()+5, conservedScalar.begin(), conservedScalar.begin() + NSCALARS); - negativeDensityEnergyPressure.insert(negativeDensityEnergyPressure.begin()+5, conservedScalar.begin(), conservedScalar.begin() + NSCALARS); - negativeDensityPressure.insert(negativeDensityPressure.begin()+5, conservedScalar.begin(), conservedScalar.begin() + NSCALARS); + negativePressure.insert(negativePressure.begin()+5, conservedScalar.begin(), conservedScalar.begin() + grid_enum::nscalars); + negativeEnergy.insert(negativeEnergy.begin()+5, conservedScalar.begin(), conservedScalar.begin() + grid_enum::nscalars); + negativeDensity.insert(negativeDensity.begin()+5, conservedScalar.begin(), conservedScalar.begin() + grid_enum::nscalars); + negativeDensityEnergyPressure.insert(negativeDensityEnergyPressure.begin()+5, conservedScalar.begin(), conservedScalar.begin() + grid_enum::nscalars); + negativeDensityPressure.insert(negativeDensityPressure.begin()+5, conservedScalar.begin(), conservedScalar.begin() + grid_enum::nscalars); #endif // SCALAR #ifdef DE 
negativePressure.push_back(mhd::utils::computeThermalEnergy(negativePressure.at(4),negativePressure.at(0),negativePressure.at(1),negativePressure.at(2),negativePressure.at(3),negativePressure.at(grid_enum::magnetic_x),negativePressure.at(grid_enum::magnetic_y),negativePressure.at(grid_enum::magnetic_z),gamma)); diff --git a/src/utils/mhd_utilities_tests.cu b/src/utils/mhd_utilities_tests.cu index dcbbebca8..d07b690d4 100644 --- a/src/utils/mhd_utilities_tests.cu +++ b/src/utils/mhd_utilities_tests.cu @@ -517,7 +517,7 @@ TEST(tMHDCellCenteredMagneticFields, size_t const n_cells = std::pow(5,3); // Make sure the vector is large enough that the locations where the // magnetic field would be in the real grid are filled - std::vector testGrid(n_cells * (8+NSCALARS)); + std::vector testGrid(n_cells * (grid_enum::num_fields)); // Populate the grid with values where testGrid.at(i) = double(i). The // values chosen aren't that important, just that every cell has a unique // value From 379b86e15def7090e5aeceb95bb5c2ea81bd8148 Mon Sep 17 00:00:00 2001 From: Alwin Date: Tue, 20 Dec 2022 17:11:38 -0800 Subject: [PATCH 07/18] Change a few comments and make dust compile on crusher --- src/dust/dust_cuda.cu | 4 ++-- src/hydro/hydro_cuda.cu | 1 + src/utils/reduction_utilities.h | 2 -- 3 files changed, 3 insertions(+), 4 deletions(-) diff --git a/src/dust/dust_cuda.cu b/src/dust/dust_cuda.cu index 524b58cd0..50356c3c5 100644 --- a/src/dust/dust_cuda.cu +++ b/src/dust/dust_cuda.cu @@ -111,7 +111,7 @@ __global__ void Dust_Kernel(Real *dev_conserved, int nx, int ny, int nz, int n_g } // McKinnon et al. (2017) -__device__ Real calc_tau_sp(Real n, Real T) { +__device__ __host__ Real calc_tau_sp(Real n, Real T) { Real YR_IN_S = 3.154e7; Real a1 = 1; // dust grain size in units of 0.1 micrometers Real d0 = n / (6e-4); // gas density in units of 10^-27 g/cm^3 @@ -125,7 +125,7 @@ __device__ Real calc_tau_sp(Real n, Real T) { } // McKinnon et al. 
(2017) -__device__ Real calc_dd_dt(Real d_dust, Real tau_sp) { +__device__ __host__ Real calc_dd_dt(Real d_dust, Real tau_sp) { return -d_dust / (tau_sp/3); } diff --git a/src/hydro/hydro_cuda.cu b/src/hydro/hydro_cuda.cu index add8af96a..3b60f97f9 100644 --- a/src/hydro/hydro_cuda.cu +++ b/src/hydro/hydro_cuda.cu @@ -604,6 +604,7 @@ Real Calc_dt_GPU(Real *dev_conserved, int nx, int ny, int nz, int n_ghost, int n } CudaCheckError(); + // Note: dev_dti[0] is DeviceVector syntactic sugar for returning a value via cudaMemcpy return dev_dti[0]; } diff --git a/src/utils/reduction_utilities.h b/src/utils/reduction_utilities.h index 9aef9600d..39089ac2e 100644 --- a/src/utils/reduction_utilities.h +++ b/src/utils/reduction_utilities.h @@ -267,8 +267,6 @@ */ __inline__ __device__ void gridReduceMax(Real val, Real* out) { - // __syncthreads(); // Wait for all threads to calculate val; - // __syncthreads(); // Wait for all threads to calculate val; // Reduce the entire block in parallel val = blockReduceMax(val); From 9ea73366ac94fa75399d7516cf49c11304ede3c1 Mon Sep 17 00:00:00 2001 From: Alwin Date: Tue, 20 Dec 2022 17:25:13 -0800 Subject: [PATCH 08/18] change -Wall and -Wno-unused-result order for frontier builds to reduce warnings --- Makefile | 2 +- builds/make.host.frontier | 4 ++-- src/grid/initial_conditions.cpp | 2 +- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/Makefile b/Makefile index 9d302d693..fa2bc4500 100644 --- a/Makefile +++ b/Makefile @@ -134,7 +134,7 @@ ifdef HIPCONFIG DFLAGS += -DO_HIP CXXFLAGS += $(HIPCONFIG) GPUCXX ?= hipcc - GPUFLAGS += -Wall + #GPUFLAGS += -Wall LD := $(CXX) LDFLAGS := $(CXXFLAGS) -L$(ROCM_PATH)/lib LIBS += -lamdhip64 diff --git a/builds/make.host.frontier b/builds/make.host.frontier index c225b3655..69f715871 100644 --- a/builds/make.host.frontier +++ b/builds/make.host.frontier @@ -11,8 +11,8 @@ CFLAGS_OPTIMIZE = -g -O2 CXXFLAGS_DEBUG = -g -O0 -std=c++17 CXXFLAGS_OPTIMIZE = -g -Ofast -std=c++17 -Wno-unused-result 
-GPUFLAGS_OPTIMIZE = -std=c++17 --offload-arch=gfx90a -Wno-unused-result -GPUFLAGS_DEBUG = -g -O0 -std=c++17 --offload-arch=gfx90a -Wno-unused-result +GPUFLAGS_OPTIMIZE = -std=c++17 --offload-arch=gfx90a -Wall -Wno-unused-result +GPUFLAGS_DEBUG = -g -O0 -std=c++17 --offload-arch=gfx90a -Wall -Wno-unused-result HIPCONFIG = -I$(ROCM_PATH)/include $(shell hipconfig -C) # workaround for Rocm 5.2 warnings #HIPCONFIG = $(shell hipconfig -C) diff --git a/src/grid/initial_conditions.cpp b/src/grid/initial_conditions.cpp index 5d98d8367..8c8c5b3f9 100644 --- a/src/grid/initial_conditions.cpp +++ b/src/grid/initial_conditions.cpp @@ -1,5 +1,5 @@ /*! \file initial_conditions.cpp -/* \brief Definitions of initial conditions for different tests. + * \brief Definitions of initial conditions for different tests. Note that the grid is mapped to 1D as i + (x_dim)*j + (x_dim*y_dim)*k. Functions are members of the Grid3D class. */ From e9c610526f7bb4e0bd33bb0b35db1734d4158b97 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Mon, 2 Jan 2023 12:47:06 -0500 Subject: [PATCH 09/18] Move magnetic divergence out of grid3D.cpp All the magnetic divergence stuff now lives in the magnetic_divergence* files. I also simplified the functions a bit --- src/grid/grid3D.cpp | 38 -------------- src/grid/grid3D.h | 11 ++-- src/main.cpp | 4 +- src/mhd/magnetic_divergence.cu | 76 ++++++++++++++++++---------- src/mhd/magnetic_divergence.h | 27 ---------- src/mhd/magnetic_divergence_tests.cu | 37 +++++++++----- 6 files changed, 82 insertions(+), 111 deletions(-) diff --git a/src/grid/grid3D.cpp b/src/grid/grid3D.cpp index bd67e87e6..8025f3744 100644 --- a/src/grid/grid3D.cpp +++ b/src/grid/grid3D.cpp @@ -43,11 +43,6 @@ #include "../dust/dust_cuda.h" // provides Dust_Update #endif -#ifdef MHD - #include "../mhd/magnetic_divergence.h" -#endif //MHD - - /*! \fn Grid3D(void) * \brief Constructor for the Grid. 
*/ Grid3D::Grid3D(void) @@ -609,39 +604,6 @@ void Grid3D::Update_Time(){ } -#ifdef MHD - void Grid3D::checkMagneticDivergence(Grid3D &G, struct parameters P, int nfile) - { - // Compute the local value of the divergence - H.max_magnetic_divergence = mhd::launchCalculateMagneticDivergence(C.device, H.dx, H.dy, H.dz, H.nx, H.ny, H.nz, H.n_cells); - - #ifdef MPI_CHOLLA - // Now that we have the local maximum let's get the global maximum - H.max_magnetic_divergence = ReduceRealMax(H.max_magnetic_divergence); - #endif //MPI_CHOLLA - - // If the magnetic divergence is greater than the limit then raise a warning and exit - if (H.max_magnetic_divergence > H.magnetic_divergence_limit) - { - // Report the error and exit - chprintf("The magnetic divergence has exceeded the maximum allowed value. Divergence = %7.4e, the maximum allowed divergence = %7.4e\n", - H.max_magnetic_divergence, H.magnetic_divergence_limit); - chexit(-1); - } - else if (H.max_magnetic_divergence < 0.0) - { - // Report the error and exit - chprintf("The magnetic divergence is negative. Divergence = %7.4e\n", - H.max_magnetic_divergence); - chexit(-1); - } - else // The magnetic divergence is within acceptable bounds - { - chprintf("Global maximum magnetic divergence = %7.4e\n", H.max_magnetic_divergence); - } - } -#endif //MHD - /*! \fn void Reset(void) * \brief Reset the Grid3D class. */ void Grid3D::Reset(void) diff --git a/src/grid/grid3D.h b/src/grid/grid3D.h index c98971189..6e8fb4c94 100644 --- a/src/grid/grid3D.h +++ b/src/grid/grid3D.h @@ -412,7 +412,7 @@ class Grid3D /*! pointer to conserved variable on device */ Real *device; Real *d_density, *d_momentum_x, *d_momentum_y, *d_momentum_z, - *d_Energy, *d_scalar, *d_basic_scalar, + *d_Energy, *d_scalar, *d_basic_scalar, *d_magnetic_x, *d_magnetic_y, *d_magnetic_z, *d_GasEnergy; @@ -466,7 +466,12 @@ class Grid3D void Update_Time(); #ifdef MHD - void checkMagneticDivergence(Grid3D &G, struct parameters P, int nfile); + /*! 
+ * \brief Compute the maximum magnetic divergence in the grid and report + * an error if it exceeds Grid3D::H::magnetic_divergence_limit or is + * negative. + */ + void checkMagneticDivergence(); #endif //MHD /*! \fn void Write_Header_Text(FILE *fp) @@ -679,7 +684,7 @@ class Grid3D void Spherical_Overdensity_3D(); void Clouds(); - + void Uniform_Grid(); void Zeldovich_Pancake( struct parameters P ); diff --git a/src/main.cpp b/src/main.cpp index 5ee396965..48dd32c70 100644 --- a/src/main.cpp +++ b/src/main.cpp @@ -193,7 +193,7 @@ int main(int argc, char *argv[]) #ifdef MHD // Check that the initial magnetic field has zero divergence - G.checkMagneticDivergence(G, P, nfile); + G.checkMagneticDivergence(); #endif //MHD // increment the next output time @@ -339,7 +339,7 @@ int main(int argc, char *argv[]) #ifdef MHD // Check that the magnetic field has zero divergence - G.checkMagneticDivergence(G, P, nfile); + G.checkMagneticDivergence(); #endif //MHD } /*end loop over timesteps*/ diff --git a/src/mhd/magnetic_divergence.cu b/src/mhd/magnetic_divergence.cu index 50aec4f1b..642cba86d 100644 --- a/src/mhd/magnetic_divergence.cu +++ b/src/mhd/magnetic_divergence.cu @@ -16,11 +16,15 @@ // External Includes // Local Includes +#include "../grid/grid3D.h" +#include "../io/io.h" #include "../mhd/magnetic_divergence.h" #include "../utils/cuda_utilities.h" #include "../utils/reduction_utilities.h" #include "../utils/DeviceVector.h" +#include "../utils/error_handling.h" #ifdef MHD + namespace mhd { // ========================================================================= @@ -77,37 +81,53 @@ namespace mhd reduction_utilities::gridReduceMax(maxDivergence, dev_maxDivergence); } // ========================================================================= +} // end namespace mhd - // ========================================================================= - Real launchCalculateMagneticDivergence(Real const *dev_conserved, - Real const dx, - Real const dy, - Real const dz, - int 
const nx, - int const ny, - int const nz, - int const n_cells) - { - // First let's create some variables we'll need. - cuda_utilities::AutomaticLaunchParams static const launchParams(mhd::calculateMagneticDivergence); - cuda_utilities::DeviceVector static dev_maxDivergence(1); +// ============================================================================= +void Grid3D::checkMagneticDivergence() +{ + // Compute the local value of the divergence + // First let's create some variables we'll need. + cuda_utilities::AutomaticLaunchParams static const launchParams(mhd::calculateMagneticDivergence); + cuda_utilities::DeviceVector static dev_maxDivergence(1); + + // Set the device side inverse time step to the smallest possible double + // so that the reduction isn't using the maximum value of the previous + // iteration + dev_maxDivergence.assign(std::numeric_limits::lowest()); - // Set the device side inverse time step to the smallest possible double - // so that the reduction isn't using the maximum value of the previous - // iteration - dev_maxDivergence.assign(std::numeric_limits::lowest()); + // Now lets get the local maximum divergence + hipLaunchKernelGGL(mhd::calculateMagneticDivergence, + launchParams.numBlocks, launchParams.threadsPerBlock, 0, 0, + C.device, dev_maxDivergence.data(), + H.dx, H.dy, H.dz, + H.nx, H.ny, H.nz, + H.n_cells); + CudaCheckError(); + H.max_magnetic_divergence = dev_maxDivergence[0]; - // Now lets get the local maximum divergence - hipLaunchKernelGGL(mhd::calculateMagneticDivergence, - launchParams.numBlocks, launchParams.threadsPerBlock, 0, 0, - dev_conserved, dev_maxDivergence.data(), - dx, dy, dz, - nx, ny, nz, - n_cells); - CudaCheckError(); + #ifdef MPI_CHOLLA + // Now that we have the local maximum let's get the global maximum + H.max_magnetic_divergence = ReduceRealMax(H.max_magnetic_divergence); + #endif //MPI_CHOLLA - return dev_maxDivergence[0]; + // If the magnetic divergence is greater than the limit then raise a warning 
and exit + if (H.max_magnetic_divergence > H.magnetic_divergence_limit) + { + // Report the error and exit + chprintf("The magnetic divergence has exceeded the maximum allowed value. Divergence = %7.4e, the maximum allowed divergence = %7.4e\n", H.max_magnetic_divergence, H.magnetic_divergence_limit); + chexit(-1); } - // ========================================================================= -} // end namespace mhd + else if (H.max_magnetic_divergence < 0.0) + { + // Report the error and exit + chprintf("The magnetic divergence is negative. Divergence = %7.4e\n", H.max_magnetic_divergence); + chexit(-1); + } + else // The magnetic divergence is within acceptable bounds + { + chprintf("Global maximum magnetic divergence = %7.4e\n", H.max_magnetic_divergence); + } +} +// ============================================================================= #endif // MHD diff --git a/src/mhd/magnetic_divergence.h b/src/mhd/magnetic_divergence.h index 8550591e2..304bf0823 100644 --- a/src/mhd/magnetic_divergence.h +++ b/src/mhd/magnetic_divergence.h @@ -51,31 +51,4 @@ namespace mhd int const nz, int const n_cells); // ========================================================================= - - // ========================================================================= - /*! 
- * \brief Handling launching and returning the value from the - * `mhd::calculateMagneticDivergence` kernel - * - * \param[in] dev_conserved The device array of conserved variables - * \param[in] dx Cell size in the X-direction - * \param[in] dy Cell size in the Y-direction - * \param[in] dz Cell size in the Z-direction - * \param[in] nx Number of cells in the X-direction - * \param[in] ny Number of cells in the Y-direction - * \param[in] nz Number of cells in the Z-direction - * \param[in] n_cells Total number of cells - * \return Real The maximum divergence of the magnetic field in the local - * part of the grid - */ - Real launchCalculateMagneticDivergence(Real const *dev_conserved, - Real const dx, - Real const dy, - Real const dz, - int const nx, - int const ny, - int const nz, - int const n_cells); - // ========================================================================= - } // end namespace mhd \ No newline at end of file diff --git a/src/mhd/magnetic_divergence_tests.cu b/src/mhd/magnetic_divergence_tests.cu index 9751f6e0b..3b1704aad 100644 --- a/src/mhd/magnetic_divergence_tests.cu +++ b/src/mhd/magnetic_divergence_tests.cu @@ -17,6 +17,7 @@ // Local Includes #include "../utils/testing_utilities.h" +#include "../grid/grid3D.h" #include "../mhd/magnetic_divergence.h" #include "../utils/DeviceVector.h" #include "../global/global.h" @@ -25,35 +26,45 @@ // ============================================================================= // Tests for the magnetic field divergence functions // ============================================================================= -TEST(tMHDLaunchCalculateMagneticDivergence, CorrectInputExpectCorrectOutput) +TEST(tMHDGrid3DcheckMagneticDivergence, CorrectInputExpectCorrectOutput) { // Grid Parameters & testing parameters size_t const gridSize = 96; // Needs to be at least 64 so that each thread has a value size_t const n_ghost = 4; - size_t const nx = gridSize+2*n_ghost, ny = nx, nz = nx; - size_t const n_cells = 
nx*ny*nz; - size_t const n_fields = 8; - Real const dx = 3, dy = dx, dz = dx; - std::vector host_grid(n_cells*n_fields); - // Fill grid with random values and randomly assign maximum value + // Instantiate Grid3D object + Grid3D G; + G.H.dx = 3; + G.H.dy = G.H.dx; + G.H.dz = G.H.dx; + G.H.nx = gridSize+2*n_ghost; + G.H.ny = G.H.nx; + G.H.nz = G.H.nx; + G.H.n_cells = G.H.nx * G.H.ny * G.H.nz; + G.H.n_fields = 8; + + // Setup host grid. Fill host grid with random values and randomly assign + // maximum value + std::vector host_grid(G.H.n_cells * G.H.n_fields); std::mt19937 prng(1); std::uniform_real_distribution doubleRand(1, 5); for (size_t i = 0; i < host_grid.size(); i++) { - host_grid.at(i) = doubleRand(prng); + host_grid.at(i) = doubleRand(prng) / 1E15; } // Allocating and copying to device cuda_utilities::DeviceVector dev_grid(host_grid.size()); + G.C.device = dev_grid.data(); dev_grid.cpyHostToDevice(host_grid); - // Get test data - Real testDivergence = mhd::launchCalculateMagneticDivergence(dev_grid.data(), dx, dy, dz, nx, ny, nz, n_cells); - + // Perform test + InitializeChollaMPI(NULL, NULL); + G.checkMagneticDivergence(); + MPI_Finalize(); // Perform Comparison - Real const fiducialDivergence = 3.6318132783263106; - testingUtilities::checkResults(fiducialDivergence, testDivergence, "maximum divergence"); + Real const fiducialDivergence = 3.6318132783263106 / 1E15; + testingUtilities::checkResults(fiducialDivergence, G.H.max_magnetic_divergence, "maximum divergence"); } // ============================================================================= // End of tests for the magnetic field divergence functions From 9b17a930653cb3de357de66f49db67ad82824602 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Mon, 2 Jan 2023 14:07:03 -0500 Subject: [PATCH 10/18] Reduce the number of make jobs in run_tests.sh Reduced the number of jobs launched to match the number of threads available. 
Will hopefully reduce memory pressure in github actions builds --- builds/run_tests.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/builds/run_tests.sh b/builds/run_tests.sh index 519c9d928..80fcab2a1 100755 --- a/builds/run_tests.sh +++ b/builds/run_tests.sh @@ -110,7 +110,7 @@ buildCholla () { echo -e "\nBuilding Cholla...\n" builtin cd $CHOLLA_ROOT - make -j TYPE=${CHOLLA_MAKE_TYPE} BUILD=${1} + make --jobs=$(nproc) TYPE=${CHOLLA_MAKE_TYPE} BUILD=${1} } # ============================================================================== @@ -121,7 +121,7 @@ buildChollaTests () { echo builtin cd $CHOLLA_ROOT - make -j TYPE=${CHOLLA_MAKE_TYPE} TEST=true + make --jobs=$(nproc) TYPE=${CHOLLA_MAKE_TYPE} TEST=true } # ============================================================================== From 7ffad0728cca4fbaf2de0c7859639cf5e8872639 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Thu, 5 Jan 2023 11:08:00 -0500 Subject: [PATCH 11/18] Move magnetic divergence out of Grid3D and into MHD The divergence calculations have all been moved out of Grid3D and into the `mhd` namespace. There wasn't any real reason for it to be in Grid3D and now all the MHD stuff is in the `mhd` namespace --- src/grid/grid3D.h | 18 +---------------- src/main.cpp | 7 +++++-- src/mhd/magnetic_divergence.cu | 29 +++++++++++++++------------- src/mhd/magnetic_divergence.h | 16 +++++++++++++++ src/mhd/magnetic_divergence_tests.cu | 5 ++--- 5 files changed, 40 insertions(+), 35 deletions(-) diff --git a/src/grid/grid3D.h b/src/grid/grid3D.h index 6e8fb4c94..d05b90214 100644 --- a/src/grid/grid3D.h +++ b/src/grid/grid3D.h @@ -245,12 +245,6 @@ struct Header Real sphere_center_y; Real sphere_center_z; - #ifdef MHD - Real max_magnetic_divergence; - Real const magnetic_divergence_limit = 1.0E-14; - #endif //MHD - - #ifdef GRAVITY /*! 
\var n_ghost_potential_offset * \brief Number of offset betewen hydro_ghost_cells and potential_ghost_cells */ @@ -464,17 +458,7 @@ class Grid3D Real Update_Hydro_Grid(void); void Update_Time(); - - #ifdef MHD - /*! - * \brief Compute the maximum magnetic divergence in the grid and report - * an error if it exceeds Grid3D::H::magnetic_divergence_limit or is - * negative. - */ - void checkMagneticDivergence(); - #endif //MHD - - /*! \fn void Write_Header_Text(FILE *fp) + /*! \fn void Write_Header_Text(FILE *fp) * \brief Write the relevant header info to a text output file. */ void Write_Header_Text(FILE *fp); diff --git a/src/main.cpp b/src/main.cpp index 48dd32c70..9e59bd651 100644 --- a/src/main.cpp +++ b/src/main.cpp @@ -22,6 +22,9 @@ #ifdef STAR_FORMATION #include "particles/star_formation.h" #endif +#ifdef MHD +#include "mhd/magnetic_divergence.h" +#endif //MHD #include "grid/grid_enum.h" @@ -193,7 +196,7 @@ int main(int argc, char *argv[]) #ifdef MHD // Check that the initial magnetic field has zero divergence - G.checkMagneticDivergence(); + mhd::checkMagneticDivergence(G); #endif //MHD // increment the next output time @@ -339,7 +342,7 @@ int main(int argc, char *argv[]) #ifdef MHD // Check that the magnetic field has zero divergence - G.checkMagneticDivergence(); + mhd::checkMagneticDivergence(G); #endif //MHD } /*end loop over timesteps*/ diff --git a/src/mhd/magnetic_divergence.cu b/src/mhd/magnetic_divergence.cu index 642cba86d..b41185d43 100644 --- a/src/mhd/magnetic_divergence.cu +++ b/src/mhd/magnetic_divergence.cu @@ -81,10 +81,9 @@ namespace mhd reduction_utilities::gridReduceMax(maxDivergence, dev_maxDivergence); } // ========================================================================= -} // end namespace mhd // ============================================================================= -void Grid3D::checkMagneticDivergence() +Real checkMagneticDivergence(Grid3D const &G) { // Compute the local value of the divergence // First let's create 
some variables we'll need. @@ -99,35 +98,39 @@ void Grid3D::checkMagneticDivergence() // Now lets get the local maximum divergence hipLaunchKernelGGL(mhd::calculateMagneticDivergence, launchParams.numBlocks, launchParams.threadsPerBlock, 0, 0, - C.device, dev_maxDivergence.data(), - H.dx, H.dy, H.dz, - H.nx, H.ny, H.nz, - H.n_cells); + G.C.device, dev_maxDivergence.data(), + G.H.dx, G.H.dy, G.H.dz, + G.H.nx, G.H.ny, G.H.nz, + G.H.n_cells); CudaCheckError(); - H.max_magnetic_divergence = dev_maxDivergence[0]; + Real max_magnetic_divergence = dev_maxDivergence[0]; #ifdef MPI_CHOLLA // Now that we have the local maximum let's get the global maximum - H.max_magnetic_divergence = ReduceRealMax(H.max_magnetic_divergence); + max_magnetic_divergence = ReduceRealMax(max_magnetic_divergence); #endif //MPI_CHOLLA // If the magnetic divergence is greater than the limit then raise a warning and exit - if (H.max_magnetic_divergence > H.magnetic_divergence_limit) + Real static const magnetic_divergence_limit = 1.0E-14; + if (max_magnetic_divergence > magnetic_divergence_limit) { // Report the error and exit - chprintf("The magnetic divergence has exceeded the maximum allowed value. Divergence = %7.4e, the maximum allowed divergence = %7.4e\n", H.max_magnetic_divergence, H.magnetic_divergence_limit); + chprintf("The magnetic divergence has exceeded the maximum allowed value. Divergence = %7.4e, the maximum allowed divergence = %7.4e\n", max_magnetic_divergence, magnetic_divergence_limit); chexit(-1); } - else if (H.max_magnetic_divergence < 0.0) + else if (max_magnetic_divergence < 0.0) { // Report the error and exit - chprintf("The magnetic divergence is negative. Divergence = %7.4e\n", H.max_magnetic_divergence); + chprintf("The magnetic divergence is negative. 
Divergence = %7.4e\n", max_magnetic_divergence); chexit(-1); } else // The magnetic divergence is within acceptable bounds { - chprintf("Global maximum magnetic divergence = %7.4e\n", H.max_magnetic_divergence); + chprintf("Global maximum magnetic divergence = %7.4e\n", max_magnetic_divergence); } + + return max_magnetic_divergence; } // ============================================================================= +} // end namespace mhd #endif // MHD diff --git a/src/mhd/magnetic_divergence.h b/src/mhd/magnetic_divergence.h index 304bf0823..a32c7ec74 100644 --- a/src/mhd/magnetic_divergence.h +++ b/src/mhd/magnetic_divergence.h @@ -14,6 +14,7 @@ // Local Includes #include "../global/global.h" +#include "../grid/grid3D.h" #include "../global/global_cuda.h" #include "../utils/gpu.hpp" @@ -51,4 +52,19 @@ namespace mhd int const nz, int const n_cells); // ========================================================================= + + // ========================================================================= + /*! + * \brief Compute the maximum magnetic divergence in the grid and report + * an error if it exceeds the magnetic divergence limit or is negative. The + * magnetic divergence limit is 1E-14 as determined by Athena as a + * reasonable upper bound for correctness. + * + * \param G The grid object + * \return Real The maximum magnetic divergence found in the grid. Can + * usually be ignored since all checking is done in the fucntion, mostly + * this return is for testing. 
+ */ + Real checkMagneticDivergence(Grid3D const &G); + // ========================================================================= } // end namespace mhd \ No newline at end of file diff --git a/src/mhd/magnetic_divergence_tests.cu b/src/mhd/magnetic_divergence_tests.cu index 3b1704aad..509d9af30 100644 --- a/src/mhd/magnetic_divergence_tests.cu +++ b/src/mhd/magnetic_divergence_tests.cu @@ -17,7 +17,6 @@ // Local Includes #include "../utils/testing_utilities.h" -#include "../grid/grid3D.h" #include "../mhd/magnetic_divergence.h" #include "../utils/DeviceVector.h" #include "../global/global.h" @@ -60,11 +59,11 @@ TEST(tMHDGrid3DcheckMagneticDivergence, CorrectInputExpectCorrectOutput) // Perform test InitializeChollaMPI(NULL, NULL); - G.checkMagneticDivergence(); + double max_magnetic_divergence = mhd::checkMagneticDivergence(G); MPI_Finalize(); // Perform Comparison Real const fiducialDivergence = 3.6318132783263106 / 1E15; - testingUtilities::checkResults(fiducialDivergence, G.H.max_magnetic_divergence, "maximum divergence"); + testingUtilities::checkResults(fiducialDivergence, max_magnetic_divergence, "maximum divergence"); } // ============================================================================= // End of tests for the magnetic field divergence functions From bfe2198d54f8aff433e673420e8f1ceb4ec743b9 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Thu, 5 Jan 2023 11:48:38 -0500 Subject: [PATCH 12/18] Cell centered B fields now use structered binding `mhd::utils::cellCenteredMagneticFields` now returns the centered magnetic fields using structured binding so the resultant values can be declared const. 
--- src/hydro/hydro_cuda.cu | 13 +++-------- src/integrators/VL_3D_cuda.cu | 3 +-- src/reconstruction/pcm_cuda.cu | 6 ++--- ...zedMpi_CorrectInputExpectCorrectOutput.txt | 2 +- src/utils/gpu.hpp | 1 - src/utils/mhd_utilities.h | 23 ++++++++++++------- src/utils/mhd_utilities_tests.cu | 3 +-- 7 files changed, 23 insertions(+), 28 deletions(-) diff --git a/src/hydro/hydro_cuda.cu b/src/hydro/hydro_cuda.cu index 3b60f97f9..e6b110ffc 100644 --- a/src/hydro/hydro_cuda.cu +++ b/src/hydro/hydro_cuda.cu @@ -524,9 +524,6 @@ __global__ void Calc_dt_3D(Real *dev_conserved, Real *dev_dti, Real gamma, int n Real max_dti = -DBL_MAX; Real d, d_inv, vx, vy, vz, E; - #ifdef MHD - Real avgBx, avgBy, avgBz; - #endif //MHD int xid, yid, zid, n_cells; n_cells = nx*ny*nz; @@ -554,7 +551,7 @@ __global__ void Calc_dt_3D(Real *dev_conserved, Real *dev_dti, Real gamma, int n #ifdef MHD // Compute the cell centered magnetic field using a straight average of // the faces - mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny, avgBx, avgBy, avgBz); + auto const [avgBx, avgBy, avgBz] = mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny); #endif //MHD // Compute the maximum inverse crossing time in the cell @@ -631,9 +628,6 @@ __global__ void Average_Slow_Cells_3D(Real *dev_conserved, int nx, int ny, int n int id, xid, yid, zid, n_cells; Real d, d_inv, vx, vy, vz, E, max_dti; Real speed, temp, P, cs; - #ifdef MHD - Real avgBx, avgBy, avgBz; - #endif //MHD // get a global thread ID id = threadIdx.x + blockIdx.x * blockDim.x; @@ -654,7 +648,7 @@ __global__ void Average_Slow_Cells_3D(Real *dev_conserved, int nx, int ny, int n #ifdef MHD // Compute the cell centered magnetic field using a straight average of the faces - mhdUtils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny, avgBx, avgBy, avgBz); + auto [avgBx, avgBy, avgBz] = mhdUtils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, 
zid, n_cells, nx, ny); #endif //MHD // Compute the maximum inverse crossing time in the cell @@ -813,8 +807,7 @@ __global__ void Partial_Update_Advected_Internal_Energy_3D( Real *dev_conserved, E_kin = hydro_utilities::Calc_Kinetic_Energy_From_Velocity(d, vx, vy, vz); #ifdef MHD // Add the magnetic energy - Real centeredBx, centeredBy, centeredBz; - mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny, centeredBx, centeredBy, centeredBz) + auto [centeredBx, centeredBy, centeredBz] = mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny) E_kin += mhd::utils::computeMagneticEnergy(magX, magY, magZ); #endif //MHD P = hydro_utilities::Get_Pressure_From_DE( E, E - E_kin, GE, gamma ); diff --git a/src/integrators/VL_3D_cuda.cu b/src/integrators/VL_3D_cuda.cu index 1f9a6a459..f007b6ce3 100644 --- a/src/integrators/VL_3D_cuda.cu +++ b/src/integrators/VL_3D_cuda.cu @@ -331,8 +331,7 @@ __global__ void Update_Conserved_Variables_3D_half(Real *dev_conserved, Real *de E_kin = hydro_utilities::Calc_Kinetic_Energy_From_Velocity(d, vx, vy, vz); #ifdef MHD // Add the magnetic energy - Real centeredBx, centeredBy, centeredBz; - mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny, centeredBx, centeredBy, centeredBz) + auto const [centeredBx, centeredBy, centeredBz] = mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny) E_kin += mhd::utils::computeMagneticEnergy(centeredBx, centeredBy, centeredBz); #endif //MHD P = hydro_utilities::Get_Pressure_From_DE( E, E - E_kin, GE, gamma ); diff --git a/src/reconstruction/pcm_cuda.cu b/src/reconstruction/pcm_cuda.cu index 4998dcd92..e6d48999a 100644 --- a/src/reconstruction/pcm_cuda.cu +++ b/src/reconstruction/pcm_cuda.cu @@ -299,10 +299,8 @@ __global__ void PCM_Reconstruction_3D(Real *dev_conserved, } #endif //SCALAR #ifdef MHD - Real cellCenteredBx, cellCenteredBy, cellCenteredBz; - 
mhd::utils::cellCenteredMagneticFields(dev_conserved, - id, xid, yid, zid, n_cells, nx, ny, - cellCenteredBx, cellCenteredBy, cellCenteredBz); + auto const [cellCenteredBx, cellCenteredBy, cellCenteredBz] = mhd::utils::cellCenteredMagneticFields(dev_conserved, + id, xid, yid, zid, n_cells, nx, ny); #endif //MHD #ifdef DE Real const ge = dev_conserved[(n_fields-1)*n_cells + id]; diff --git a/src/system_tests/input_files/tMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput.txt b/src/system_tests/input_files/tMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput.txt index 6fb66732b..71dd9bd91 100644 --- a/src/system_tests/input_files/tMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput.txt +++ b/src/system_tests/input_files/tMHDSYSTEMSodShockTubeParameterizedMpi_CorrectInputExpectCorrectOutput.txt @@ -1,5 +1,5 @@ # -# Parameter File for 1D Sod Shock tube +# Parameter File for 3D Sod Shock tube # ################################################ diff --git a/src/utils/gpu.hpp b/src/utils/gpu.hpp index 66f2885f2..461f9821b 100644 --- a/src/utils/gpu.hpp +++ b/src/utils/gpu.hpp @@ -53,7 +53,6 @@ static constexpr int maxWarpsPerBlock = 1024/WARPSIZE; #define cudaMemcpy hipMemcpy #define cudaMemcpyAsync hipMemcpyAsync #define cudaMemcpyPeer hipMemcpyPeer -#define cudaMemcpyPeer hipMemcpyPeer #define cudaMemcpyDeviceToHost hipMemcpyDeviceToHost #define cudaMemcpyDeviceToDevice hipMemcpyDeviceToDevice #define cudaMemcpyHostToDevice hipMemcpyHostToDevice diff --git a/src/utils/mhd_utilities.h b/src/utils/mhd_utilities.h index 6b587e535..ef64b9536 100644 --- a/src/utils/mhd_utilities.h +++ b/src/utils/mhd_utilities.h @@ -298,32 +298,39 @@ namespace utils{ * \param[out] avgBx The cell centered average magnetic field in the x-direction * \param[out] avgBy The cell centered average magnetic field in the y-direction * \param[out] avgBz The cell centered average magnetic field in the z-direction + * + * \return Real local struct 
with the X, Y, and Z cell centered magnetic + * fields. Intended to be called with structured binding like `auto [x, y, + * z] = mhd::utils::cellCenteredMagneticFields(*args*) */ - inline __host__ __device__ void cellCenteredMagneticFields(Real const *dev_conserved, + inline __host__ __device__ auto cellCenteredMagneticFields(Real const *dev_conserved, size_t const &id, size_t const &xid, size_t const &yid, size_t const &zid, size_t const &n_cells, size_t const &nx, - size_t const &ny, - Real &avgBx, - Real &avgBy, - Real &avgBz) + size_t const &ny) { // Ternary operator to check that no values outside of the magnetic field // arrays are loaded. If the cell is on the edge that doesn't have magnetic // fields on both sides then instead set the centered magnetic field to be // equal to the magnetic field of the closest edge. T - avgBx = (xid > 0) ? + Real avgBx = (xid > 0) ? /*if true*/ 0.5 * (dev_conserved[(grid_enum::magnetic_x)*n_cells + id] + dev_conserved[(grid_enum::magnetic_x)*n_cells + cuda_utilities::compute1DIndex(xid-1, yid, zid, nx, ny)]): /*if false*/ dev_conserved[(grid_enum::magnetic_x)*n_cells + id]; - avgBy = (yid > 0) ? + Real avgBy = (yid > 0) ? /*if true*/ 0.5 * (dev_conserved[(grid_enum::magnetic_y)*n_cells + id] + dev_conserved[(grid_enum::magnetic_y)*n_cells + cuda_utilities::compute1DIndex(xid, yid-1, zid, nx, ny)]): /*if false*/ dev_conserved[(grid_enum::magnetic_y)*n_cells + id]; - avgBz = (zid > 0) ? + Real avgBz = (zid > 0) ? 
/*if true*/ 0.5 * (dev_conserved[(grid_enum::magnetic_z)*n_cells + id] + dev_conserved[(grid_enum::magnetic_z)*n_cells + cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny)]): /*if false*/ dev_conserved[(grid_enum::magnetic_z)*n_cells + id]; + + struct returnStruct + { + Real x, y, z; + }; + return returnStruct{avgBx, avgBy, avgBz}; } #endif // MHD // ========================================================================= diff --git a/src/utils/mhd_utilities_tests.cu b/src/utils/mhd_utilities_tests.cu index d07b690d4..83500c68f 100644 --- a/src/utils/mhd_utilities_tests.cu +++ b/src/utils/mhd_utilities_tests.cu @@ -527,10 +527,9 @@ TEST(tMHDCellCenteredMagneticFields, double const fiducialAvgBx = 637.5, fiducialAvgBy = 761.5, fiducialAvgBz = 883.5; - double testAvgBx, testAvgBy, testAvgBz; // Call the function to test - mhd::utils::cellCenteredMagneticFields(testGrid.data(), id, xid, yid, zid, n_cells, nx, ny, testAvgBx, testAvgBy, testAvgBz); + auto [testAvgBx, testAvgBy, testAvgBz] = mhd::utils::cellCenteredMagneticFields(testGrid.data(), id, xid, yid, zid, n_cells, nx, ny); // Check the results testingUtilities::checkResults(fiducialAvgBx, testAvgBx, "cell centered Bx value"); From 05f086eeac36c03e4fad182b9853e7a698b634c1 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Thu, 5 Jan 2023 12:00:14 -0500 Subject: [PATCH 13/18] Fix threadguard in magnetic field update --- src/mhd/magnetic_update.cu | 6 +++--- src/mhd/magnetic_update_tests.cu | 8 ++++---- 2 files changed, 7 insertions(+), 7 deletions(-) diff --git a/src/mhd/magnetic_update.cu b/src/mhd/magnetic_update.cu index 550fb7188..28a1d9465 100644 --- a/src/mhd/magnetic_update.cu +++ b/src/mhd/magnetic_update.cu @@ -36,9 +36,9 @@ namespace mhd // Thread guard to avoid overrun and to skip ghost cells that cannot be // evolved due to missing electric fields that can't be reconstructed - if ( xid < nx-1 - and yid < ny-1 - and zid < nz-1) + if ( xid < nx-2 + and yid < ny-2 + and zid < nz-2) { // Compute the 
three dt/dx quantities Real const dtodx = dt/dx; diff --git a/src/mhd/magnetic_update_tests.cu b/src/mhd/magnetic_update_tests.cu index 501803e1c..f4d0d44a0 100644 --- a/src/mhd/magnetic_update_tests.cu +++ b/src/mhd/magnetic_update_tests.cu @@ -36,7 +36,7 @@ public: */ tMHDUpdateMagneticField3D() : - nx(2), + nx(3), ny(nx), nz(nx), n_cells(nx*ny*nz), @@ -141,9 +141,9 @@ TEST_F(tMHDUpdateMagneticField3D, CorrectInputExpectCorrectOutput) { // Fiducial values - fiducialData.at(40) = 42.559999999999995; - fiducialData.at(48) = 44.160000000000004; - fiducialData.at(56) = 57.280000000000001; + fiducialData.at(135) = 142.68000000000001; + fiducialData.at(162) = 151.75999999999999; + fiducialData.at(189) = 191.56; // Launch kernel and check results runTest(); From 1c50a705a9e7b2263ed28df17e3259ece782ab92 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Thu, 5 Jan 2023 12:02:43 -0500 Subject: [PATCH 14/18] Fix copy-pasted comment --- src/mhd/magnetic_divergence.cu | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/src/mhd/magnetic_divergence.cu b/src/mhd/magnetic_divergence.cu index b41185d43..447e11163 100644 --- a/src/mhd/magnetic_divergence.cu +++ b/src/mhd/magnetic_divergence.cu @@ -90,9 +90,8 @@ Real checkMagneticDivergence(Grid3D const &G) cuda_utilities::AutomaticLaunchParams static const launchParams(mhd::calculateMagneticDivergence); cuda_utilities::DeviceVector static dev_maxDivergence(1); - // Set the device side inverse time step to the smallest possible double - // so that the reduction isn't using the maximum value of the previous - // iteration + // Set the device side divergence to the smallest possible double so that + // the reduction isn't using the maximum value of the previous iteration dev_maxDivergence.assign(std::numeric_limits::lowest()); // Now lets get the local maximum divergence From 0be3a500582afec7a193745bddaf186b73c2c1f5 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Thu, 5 Jan 2023 15:44:05 -0500 Subject: [PATCH 15/18] Add 
citations in comments --- src/integrators/VL_3D_cuda.cu | 5 ++++- src/mhd/ct_electric_fields.cu | 31 +++++++++++++++----------- src/mhd/ct_electric_fields.h | 10 ++++++--- src/mhd/magnetic_divergence.cu | 5 ++++- src/mhd/magnetic_update.cu | 7 +++++- src/mhd/magnetic_update.h | 4 +++- src/riemann_solvers/hlld_cuda.cu | 37 +++++++++++++++++++++++++++----- src/riemann_solvers/hlld_cuda.h | 14 +++++++----- 8 files changed, 83 insertions(+), 30 deletions(-) diff --git a/src/integrators/VL_3D_cuda.cu b/src/integrators/VL_3D_cuda.cu index f007b6ce3..9a9ee6cb1 100644 --- a/src/integrators/VL_3D_cuda.cu +++ b/src/integrators/VL_3D_cuda.cu @@ -1,5 +1,8 @@ /*! \file VL_3D_cuda.cu - * \brief Definitions of the cuda 3 D VL algorithm functions. */ + * \brief Definitions of the cuda 3 D VL algorithm functions. MHD algorithm + * from Stone & Gardiner 2009 "A simple unsplit Godunov method for + * multidimensional MHD" + */ #if defined(CUDA) && defined(VL) diff --git a/src/mhd/ct_electric_fields.cu b/src/mhd/ct_electric_fields.cu index cd90ae2ac..aa0ac3061 100644 --- a/src/mhd/ct_electric_fields.cu +++ b/src/mhd/ct_electric_fields.cu @@ -1,7 +1,9 @@ /*! * \file ct_electric_fields.cu * \author Robert 'Bob' Caddy (rvc@pitt.edu) - * \brief Contains implementation for the CT electric fields code + * \brief Contains implementation for the CT electric fields code. Method from + * Stone & Gardiner 2009 "A simple unsplit Godunov method for multidimensional + * MHD" hereafter referred to as "S&G 2009" * */ @@ -80,7 +82,7 @@ namespace mhd // X electric field // ================ - // Y-direction slope on the positive Y side + // Y-direction slope on the positive Y side. 
S&G 2009 equation 23 signUpwind = fluxZ[cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny)]; if (signUpwind > 0.0) { @@ -96,7 +98,7 @@ namespace mhd + mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, -1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells)); } - // Y-direction slope on the negative Y side + // Y-direction slope on the negative Y side. S&G 2009 equation 23 signUpwind = fluxZ[cuda_utilities::compute1DIndex(xid, yid-1, zid-1, nx, ny)]; if (signUpwind > 0.0) { @@ -112,7 +114,7 @@ namespace mhd + mhd::_internal::_ctSlope(fluxY, dev_conserved, -1, 0, 1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells)); } - // Z-direction slope on the positive Z side + // Z-direction slope on the positive Z side. S&G 2009 equation 23 signUpwind = fluxY[cuda_utilities::compute1DIndex(xid, yid-1, zid, nx, ny)]; if (signUpwind > 0.0) { @@ -128,7 +130,7 @@ namespace mhd + mhd::_internal::_ctSlope(fluxZ, dev_conserved, 1, 0, -1, -1, 2, -1, xid, yid, zid, nx, ny, n_cells)); } - // Z-direction slope on the negative Z side + // Z-direction slope on the negative Z side. S&G 2009 equation 23 signUpwind = fluxY[cuda_utilities::compute1DIndex(xid, yid-1, zid-1, nx, ny)]; if (signUpwind > 0.0) { @@ -154,6 +156,7 @@ namespace mhd // sum and average face centered electric fields and slopes to get the // edge averaged electric field. + // S&G 2009 equation 22 ctElectricFields[threadId + 0*n_cells] = 0.25 * (+ face_y_pos + face_y_neg + face_z_pos @@ -167,7 +170,7 @@ namespace mhd // Y electric field // ================ - // X-direction slope on the positive X side + // X-direction slope on the positive X side. S&G 2009 equation 23 signUpwind = fluxZ[cuda_utilities::compute1DIndex(xid, yid, zid-1, nx, ny)]; if (signUpwind > 0.0) { @@ -183,7 +186,7 @@ namespace mhd + mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, -1, -1, 0, -1, xid, yid, zid, nx, ny, n_cells)); } - // X-direction slope on the negative X side + // X-direction slope on the negative X side. 
S&G 2009 equation 23 signUpwind = fluxZ[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny)]; if (signUpwind > 0.0) { @@ -199,7 +202,7 @@ namespace mhd + mhd::_internal::_ctSlope(fluxX, dev_conserved, 1, 1, 0, -1, 0, -1, xid, yid, zid, nx, ny, n_cells)); } - // Z-direction slope on the positive Z side + // Z-direction slope on the positive Z side. S&G 2009 equation 23 signUpwind = fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid, nx, ny)]; if (signUpwind > 0.0) { @@ -215,7 +218,7 @@ namespace mhd + mhd::_internal::_ctSlope(fluxZ, dev_conserved, -1, 1, -1, -1, 2, -1, xid, yid, zid, nx, ny, n_cells)); } - // Z-direction slope on the negative Z side + // Z-direction slope on the negative Z side. S&G 2009 equation 23 signUpwind = fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid-1, nx, ny)]; if (signUpwind > 0.0) { @@ -240,6 +243,7 @@ namespace mhd // sum and average face centered electric fields and slopes to get the // edge averaged electric field. + // S&G 2009 equation 22 ctElectricFields[threadId + 1*n_cells] = 0.25 * (+ face_x_pos + face_x_neg + face_z_pos @@ -253,7 +257,7 @@ namespace mhd // Z electric field // ================ - // Y-direction slope on the positive Y side + // Y-direction slope on the positive Y side. S&G 2009 equation 23 signUpwind = fluxX[cuda_utilities::compute1DIndex(xid-1, yid, zid, nx, ny)]; if (signUpwind > 0.0) { @@ -269,7 +273,7 @@ namespace mhd + mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, -1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells)); } - // Y-direction slope on the negative Y side + // Y-direction slope on the negative Y side. S&G 2009 equation 23 signUpwind = fluxX[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny)]; if (signUpwind > 0.0) { @@ -285,7 +289,7 @@ namespace mhd + mhd::_internal::_ctSlope(fluxY, dev_conserved, 1, 2, 1, -1, 1, -1, xid, yid, zid, nx, ny, n_cells)); } - // X-direction slope on the positive X side + // X-direction slope on the positive X side. 
S&G 2009 equation 23 signUpwind = fluxY[cuda_utilities::compute1DIndex(xid, yid-1, zid, nx, ny)]; if (signUpwind > 0.0) { @@ -301,7 +305,7 @@ namespace mhd + mhd::_internal::_ctSlope(fluxX, dev_conserved, -1, 2, -1, -1, 0, -1, xid, yid, zid, nx, ny, n_cells)); } - // X-direction slope on the negative X side + // X-direction slope on the negative X side. S&G 2009 equation 23 signUpwind = fluxY[cuda_utilities::compute1DIndex(xid-1, yid-1, zid, nx, ny)]; if (signUpwind > 0.0) { @@ -326,6 +330,7 @@ namespace mhd // sum and average face centered electric fields and slopes to get the // edge averaged electric field. + // S&G 2009 equation 22 ctElectricFields[threadId + 2*n_cells] = 0.25 * (+ face_x_pos + face_x_neg + face_y_pos diff --git a/src/mhd/ct_electric_fields.h b/src/mhd/ct_electric_fields.h index 3db5927ad..9ba8780ee 100644 --- a/src/mhd/ct_electric_fields.h +++ b/src/mhd/ct_electric_fields.h @@ -1,7 +1,9 @@ /*! * \file ct_electric_fields.h * \author Robert 'Bob' Caddy (rvc@pitt.edu) - * \brief Contains the declaration for the kernel that computes the CT electric fields + * \brief Contains the declaration for the kernel that computes the CT electric + * fields. Method from Stone & Gardiner 2009 "A simple unsplit Godunov method + * for multidimensional MHD" hereafter referred to as "S&G 2009" * */ @@ -31,7 +33,8 @@ namespace mhd // ===================================================================== /*! * \brief Compute and return the slope of the electric field used to - compute the CT electric fields + * compute the CT electric fields. 
This function implements S&G 2009 + * equation 24 * * \param[in] flux The flux array * \param[in] dev_conserved The conserved variable array @@ -118,10 +121,11 @@ namespace mhd Real const electric_face = fluxSign * flux[idxFlux + (int(fluxSign == 1)+grid_enum::magnetic_start)*n_cells]; // Compute the slope and return it + // S&G 2009 equation 24 return electric_face - electric_centered; } // ===================================================================== - }// _mhd_internal namespace + }// mhd::_internal namespace // ========================================================================= /*! diff --git a/src/mhd/magnetic_divergence.cu b/src/mhd/magnetic_divergence.cu index 447e11163..fc84cbb3f 100644 --- a/src/mhd/magnetic_divergence.cu +++ b/src/mhd/magnetic_divergence.cu @@ -5,7 +5,9 @@ * for the various kernels, functions, and tools required for the 3D VL+CT MHD * integrator. Due to the CUDA/HIP compiler requiring that device functions be * directly accessible to the file they're used in most device functions will be - * implemented in the header file + * implemented in the header file. Uses the same method described in Stone et + * al. 2008 "ATHENA: A new code for astrophysical MHD", hereafter referred to as + * Stone et al. 2008 * */ @@ -62,6 +64,7 @@ namespace mhd id_zMin1 = cuda_utilities::compute1DIndex(xid , yid , zid-1, nx, ny); // Compute divergence + // Stone et al. 2008 equation 25 cellDivergence = (( dev_conserved[id + (grid_enum::magnetic_x)*n_cells] - dev_conserved[id_xMin1 + (grid_enum::magnetic_x)*n_cells]) diff --git a/src/mhd/magnetic_update.cu b/src/mhd/magnetic_update.cu index 28a1d9465..541fb83ba 100644 --- a/src/mhd/magnetic_update.cu +++ b/src/mhd/magnetic_update.cu @@ -1,7 +1,9 @@ /*! * \file magnetic_update.cu * \author Robert 'Bob' Caddy (rvc@pitt.edu) - * \brief Contains the definition of the kernel to update the magnetic field + * \brief Contains the definition of the kernel to update the magnetic field. 
+ * Method from Stone & Gardiner 2009 "A simple unsplit Godunov method for + * multidimensional MHD" hereafter referred to as "S&G 2009" * */ @@ -61,16 +63,19 @@ namespace mhd // Perform Updates // X field update + // S&G 2009 equation 10 destinationGrid[threadId + (grid_enum::magnetic_x)*n_cells] = sourceGrid[threadId + (grid_enum::magnetic_x)*n_cells] + dtodz * (electric_y_3 - electric_y_1) + dtody * (electric_z_1 - electric_z_3); // Y field update + // S&G 2009 equation 11 destinationGrid[threadId + (grid_enum::magnetic_y)*n_cells] = sourceGrid[threadId + (grid_enum::magnetic_y)*n_cells] + dtodx * (electric_z_3 - electric_z_2) + dtodz * (electric_x_1 - electric_x_3); // Z field update + // S&G 2009 equation 12 destinationGrid[threadId + (grid_enum::magnetic_z)*n_cells] = sourceGrid[threadId + (grid_enum::magnetic_z)*n_cells] + dtody * (electric_x_3 - electric_x_2) + dtodx * (electric_y_2 - electric_y_3); diff --git a/src/mhd/magnetic_update.h b/src/mhd/magnetic_update.h index 2c89e26ba..4b71689b6 100644 --- a/src/mhd/magnetic_update.h +++ b/src/mhd/magnetic_update.h @@ -1,7 +1,9 @@ /*! * \file magnetic_update.h * \author Robert 'Bob' Caddy (rvc@pitt.edu) - * \brief Contains the declaration of the kernel to update the magnetic field + * \brief Contains the declaration of the kernel to update the magnetic field. + * Method from Stone & Gardiner 2009 "A simple unsplit Godunov method for + * multidimensional MHD" hereafter referred to as "S&G 2009" * */ diff --git a/src/riemann_solvers/hlld_cuda.cu b/src/riemann_solvers/hlld_cuda.cu index a7793150b..8b5ac667e 100644 --- a/src/riemann_solvers/hlld_cuda.cu +++ b/src/riemann_solvers/hlld_cuda.cu @@ -1,7 +1,9 @@ /*! 
* \file hlld_cuda.cu * \author Robert 'Bob' Caddy (rvc@pitt.edu) - * \brief Contains the implementation of the HLLD solver + * \brief Contains the implementation of the HLLD solver from Miyoshi & Kusano 2005 + * "A multi-state HLL approximate Riemann solver for ideal magnetohydrodynamics", + * hereafter referred to as M&K 2005 * */ @@ -241,6 +243,7 @@ namespace mhd // If we're in the L state then assign fluxes and return. // In this state the flow is supersonic + // M&K 2005 equation 66 if (speedL >= 0.0) { mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, @@ -282,6 +285,7 @@ namespace mhd // If we're in the R state then assign fluxes and return. // In this state the flow is supersonic + // M&K 2005 equation 66 if (speedR <= 0.0) { mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, @@ -307,6 +311,8 @@ namespace mhd // ================================================================= // Shared quantity // note that velocityStarX = speedM + // M&K 2005 equation 23, might need to switch to eqn. 41 in the + // future though they should produce identical results Real totalPressureStar = totalPressureL + densityL * (speedL - velocityXL) * (speedM - velocityXL); @@ -355,6 +361,7 @@ namespace mhd // If we're in the L* state then assign fluxes and return. // In this state the flow is subsonic + // M&K 2005 equation 66 if (speedStarL >= 0.0) { mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, @@ -419,6 +426,7 @@ namespace mhd // If we're in the R* state then assign fluxes and return. 
// In this state the flow is subsonic + // M&K 2005 equation 66 if (speedStarR <= 0.0) { mhd::_internal::_returnFluxes(threadId, o1, o2, o3, n_cells, @@ -468,6 +476,7 @@ namespace mhd energyDoubleStarR); // Compute and return L** fluxes + // M&K 2005 equation 66 if (speedM >= 0.0) { Real momentumDoubleStarFluxX, momentumDoubleStarFluxY, momentumDoubleStarFluxZ, @@ -520,6 +529,7 @@ namespace mhd return; } // Compute and return R** fluxes + // M&K 2005 equation 66 else if (speedStarR >= 0.0) { Real momentumDoubleStarFluxX, momentumDoubleStarFluxY, momentumDoubleStarFluxZ, @@ -626,11 +636,13 @@ namespace mhd // Compute the S_L and S_R wave speeds. // Version suggested by Miyoshi & Kusano 2005 and used in Athena + // M&K 2005 equation 67 Real magSonicMax = fmax(magSonicL, magSonicR); speedL = fmin(velocityXL, velocityXR) - magSonicMax; speedR = fmax(velocityXL, velocityXR) + magSonicMax; // Compute the S_M wave speed + // M&K 2005 equation 38 speedM = // Numerator ( momentumXR * (speedR - velocityXR) - momentumXL * (speedL - velocityXL) @@ -641,10 +653,12 @@ namespace mhd - densityL * (speedL - velocityXL)); // Compute the densities in the star state + // M&K 2005 equation 43 densityStarL = densityL * (speedL - velocityXL) / (speedL - speedM); densityStarR = densityR * (speedR - velocityXR) / (speedR - speedM); // Compute the S_L^* and S_R^* wave speeds + // M&K 2005 equation 51 speedStarL = speedM - mhd::utils::alfvenSpeed(magneticX, densityStarL); speedStarR = speedM + mhd::utils::alfvenSpeed(magneticX, densityStarR); } @@ -668,6 +682,7 @@ namespace mhd Real &magneticFluxZ, Real &energyFlux) { + // M&K 2005 equation 2 densityFlux = momentumX; momentumFluxX = momentumX * velocityX + totalPressure - magneticX * magneticX; @@ -748,6 +763,7 @@ namespace mhd Real &magneticStarFluxZ) { // Check for and handle the degenerate case + // Explained at the top of page 326 in M&K 2005 if (fabs(density * (speedSide - velocityX) * (speedSide - speedM) - (magneticX * magneticX)) @@ 
-760,22 +776,26 @@ namespace mhd } else { + // Denominator for M&K 2005 equations 44-47 Real const denom = density * (speedSide - velocityX) * (speedSide - speedM) - (magneticX * magneticX); // Compute the velocity and magnetic field in the star state + // M&K 2005 equations 44 & 46 Real coef = magneticX * (speedM - velocityX) / denom; velocityStarY = velocityY - magneticY * coef; velocityStarZ = velocityZ - magneticZ * coef; + // M&K 2005 equations 45 & 47 Real tmpPower = (speedSide - velocityX); - tmpPower = tmpPower * tmpPower; - coef = (density * tmpPower - (magneticX * magneticX)) / denom; + tmpPower = tmpPower * tmpPower; + coef = (density * tmpPower - (magneticX * magneticX)) / denom; magneticStarY = magneticY * coef; magneticStarZ = magneticZ * coef; } + // M&K 2005 equation 48 energyStar = ( energy * (speedSide - velocityX) - totalPressure * velocityX + totalPressureStar * speedM @@ -784,6 +804,7 @@ namespace mhd / (speedSide - speedM); // Now compute the star state fluxes + // M&K 2005 equations 64 densityStarFlux = densityFlux + speedSide * (densityStar - density);; momentumStarFluxX = momentumFluxX + speedSide * (densityStar * speedM - momentumX);; momentumStarFluxY = momentumFluxY + speedSide * (densityStar * velocityStarY - momentumY);; @@ -818,14 +839,16 @@ namespace mhd Real &energyDoubleStarR) { // if Bx is zero then just return the star state + // Explained at the top of page 328 in M&K 2005. 
Essentially when + // magneticX is 0 this reduces to the HLLC solver if (magneticX < mhd::_internal::_hlldSmallNumber * totalPressureStar) { velocityDoubleStarY = velocityStarYL; velocityDoubleStarZ = velocityStarZL; magneticDoubleStarY = magneticStarYL; magneticDoubleStarZ = magneticStarZL; - energyDoubleStarL = energyStarL; - energyDoubleStarR = energyStarR; + energyDoubleStarL = energyStarL; + energyDoubleStarR = energyStarR; } else { @@ -839,6 +862,7 @@ namespace mhd // and magnetic fields along with the energy // Double Star velocities + // M&K 2005 equations 59 & 60 velocityDoubleStarY = inverseDensities * (sqrtDL * velocityStarYL + sqrtDR * velocityStarYR + magXSign * (magneticStarYR - magneticStarYL)); @@ -847,6 +871,7 @@ namespace mhd + magXSign * (magneticStarZR - magneticStarZL)); // Double star magnetic fields + // M&K 2005 equations 61 & 62 magneticDoubleStarY = inverseDensities * (sqrtDL * magneticStarYR + sqrtDR * magneticStarYL + magXSign * (sqrtDL * sqrtDR) * (velocityStarYR - velocityStarYL)); @@ -861,6 +886,7 @@ namespace mhd magneticX, magneticDoubleStarY, magneticDoubleStarZ); + // M&K 2005 equation 63 energyDoubleStarL = energyStarL - sqrtDL * magXSign * (math_utils::dotProduct(speedM, velocityStarYL, velocityStarZL, magneticX, magneticStarYL, magneticStarZL) - velDblStarDotMagDblStar); @@ -899,6 +925,7 @@ namespace mhd Real &magneticDoubleStarFluxY, Real &magneticDoubleStarFluxZ) { + // M&K 2005 equation 65 momentumDoubleStarFluxX = momentumStarFluxX + speedStarSide * (velocityDoubleStarX - velocityStarX) * densityStar; momentumDoubleStarFluxY = momentumStarFluxY + speedStarSide * (velocityDoubleStarY - velocityStarY) * densityStar; momentumDoubleStarFluxZ = momentumStarFluxZ + speedStarSide * (velocityDoubleStarZ - velocityStarZ) * densityStar; diff --git a/src/riemann_solvers/hlld_cuda.h b/src/riemann_solvers/hlld_cuda.h index 357c850d6..332768f8a 100644 --- a/src/riemann_solvers/hlld_cuda.h +++ b/src/riemann_solvers/hlld_cuda.h @@ -1,7 
+1,9 @@ /*! * \file hlld_cuda.cu * \author Robert 'Bob' Caddy (rvc@pitt.edu) - * \brief Contains the declaration of the HLLD solver + * \brief Contains the declaration of the HLLD solver from Miyoshi & Kusano 2005 + * "A multi-state HLL approximate Riemann solver for ideal magnetohydrodynamics", + * hereafter referred to as M&K 2005 * */ @@ -63,7 +65,8 @@ namespace mhd /*! * \brief Compute the left, right, star, and middle wave speeds. Also - * returns the densities in the star states + * returns the densities in the star states. M&K 2005 equations 38, 43, + * 51, and 67 * * \param[in] densityL Density, left side * \param[in] momentumXL Momentum in the X-direction, left side @@ -198,7 +201,8 @@ namespace mhd Real const &energyFlux); /*! - * \brief Compute the fluxes in the left or right star state + * \brief Compute the fluxes in the left or right star state. M&K 2005 + * equations 44-48, 64 * * \param[in] speedM Speed of the central wave * \param[in] speedSide Speed of the non-star wave on the side being computed @@ -274,7 +278,7 @@ namespace mhd Real &magneticStarFluxZ); /*! - * \brief Compute the double star state + * \brief Compute the double star state. M&K 2005 equations 59-63 * * \param[in] speedM * \param[in] magneticX @@ -321,7 +325,7 @@ namespace mhd Real &energyDoubleStarR); /*! - * \brief Compute the double star state fluxes + * \brief Compute the double star state fluxes. 
M&K 2005 equation 65 * * \param[in] speedStarSide The star speed on the side being computed * \param[in] momentumStarFluxX From ef4f4035db3db7a68df3797364d7410617a64548 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Thu, 5 Jan 2023 15:56:36 -0500 Subject: [PATCH 16/18] More citations in comments --- src/integrators/VL_3D_cuda.cu | 10 +++++----- src/mhd/ct_electric_fields.cu | 10 +++++----- 2 files changed, 10 insertions(+), 10 deletions(-) diff --git a/src/integrators/VL_3D_cuda.cu b/src/integrators/VL_3D_cuda.cu index 9a9ee6cb1..2fb413870 100644 --- a/src/integrators/VL_3D_cuda.cu +++ b/src/integrators/VL_3D_cuda.cu @@ -74,11 +74,11 @@ void VL_Algorithm_3D_CUDA(Real *d_conserved, Real *d_grav_potential, int nx, int // store in the interface on the "right" side of the cell, so the flux // arrays store the fluxes through the right interface // - // According to the source code of Athena, the following equation relate - // the magnetic flux to the face centered electric fields/EMF. - // -cross(V,B)x is the negative of the x-component of V cross B. Note that - // "X" is the direction the solver is running in this case, not - // necessarily the true "X". + // According to Stone et al. 2008 section 5.3 and the source code of + // Athena, the following equation relate the magnetic flux to the face + // centered electric fields/EMF. -cross(V,B)x is the negative of the + // x-component of V cross B. Note that "X" is the direction the solver is + // running in this case, not necessarily the true "X". 
// F_x[(grid_enum::fluxX_magnetic_z)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Z // F_x[(grid_enum::fluxX_magnetic_y)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Y // F_y[(grid_enum::fluxY_magnetic_x)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_X diff --git a/src/mhd/ct_electric_fields.cu b/src/mhd/ct_electric_fields.cu index aa0ac3061..542dda3a7 100644 --- a/src/mhd/ct_electric_fields.cu +++ b/src/mhd/ct_electric_fields.cu @@ -41,11 +41,11 @@ namespace mhd and yid < ny and zid < nz) { - // According to the source code of Athena, the following equation - // relate the magnetic flux to the face centered electric - // fields/EMF. -cross(V,B)x is the negative of the x-component of V - // cross B. Note that "X" is the direction the solver is running in - // this case, not necessarily the true "X". + // According to Stone et al. 2008 section 5.3 and the source code of + // Athena, the following equation relate the magnetic flux to the + // face centered electric fields/EMF. -cross(V,B)x is the negative + // of the x-component of V cross B. Note that "X" is the direction + // the solver is running in this case, not necessarily the true "X". 
// F_x[(grid_enum::fluxX_magnetic_z)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_Z // F_x[(grid_enum::fluxX_magnetic_y)*n_cells] = VxBz - BxVz = (-cross(V,B))y = EMF_Y // F_y[(grid_enum::fluxY_magnetic_x)*n_cells] = VxBy - BxVy = -(-cross(V,B))z = -EMF_X From d05c4e61b215f3511804e62e3ca55355dce79e34 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Tue, 10 Jan 2023 13:56:49 -0500 Subject: [PATCH 17/18] Add MHD support to python_scripts/cat_dset_3D.py --- python_scripts/cat_dset_3D.py | 29 +++++++++++++++++++++++------ 1 file changed, 23 insertions(+), 6 deletions(-) diff --git a/python_scripts/cat_dset_3D.py b/python_scripts/cat_dset_3D.py index 0c6d4b3ad..1a823e268 100755 --- a/python_scripts/cat_dset_3D.py +++ b/python_scripts/cat_dset_3D.py @@ -11,11 +11,10 @@ iend = 1*n_proc dnamein = './hdf5/raw/' dnameout = './hdf5/' -DE = 0 # loop over outputs for n in range(ns, ne+1): - + # loop over files for a given output for i in range(istart, iend): @@ -26,7 +25,7 @@ # read in the header data from the input file head = filein.attrs - # if it's the first input file, write the header attributes + # if it's the first input file, write the header attributes # and create the datasets in the output file if (i == 0): nx = head['dims'][0] @@ -47,8 +46,17 @@ my = fileout.create_dataset("momentum_y", (nx, ny, nz), chunks=True) mz = fileout.create_dataset("momentum_z", (nx, ny, nz), chunks=True) E = fileout.create_dataset("Energy", (nx, ny, nz), chunks=True) - if (DE): + try: GE = fileout.create_dataset("GasEnergy", (nx, ny, nz), chunks=True) + except KeyError: + print('No Dual energy data present'); + try: + [nx_mag, ny_mag, nz_mag] = head['magnetic_field_dims'] + bx = fileout.create_dataset("magnetic_x", (nx_mag, ny_mag, nz_mag), chunks=True) + by = fileout.create_dataset("magnetic_y", (nx_mag, ny_mag, nz_mag), chunks=True) + bz = fileout.create_dataset("magnetic_z", (nx_mag, ny_mag, nz_mag), chunks=True) + except KeyError: + print('No magnetic field data present'); # write 
data from individual processor file to # correct location in concatenated file @@ -63,9 +71,18 @@ fileout['momentum_y'][xs:xs+nxl,ys:ys+nyl,zs:zs+nzl] = filein['momentum_y'] fileout['momentum_z'][xs:xs+nxl,ys:ys+nyl,zs:zs+nzl] = filein['momentum_z'] fileout['Energy'][xs:xs+nxl,ys:ys+nyl,zs:zs+nzl] = filein['Energy'] - if (DE): + try: fileout['GasEnergy'][xs:xs+nxl,ys:ys+nyl,zs:zs+nzl] = filein['GasEnergy'] - + except KeyError: + print('No Dual energy data present'); + try: + [nxl_mag, nyl_mag, nzl_mag] = head['magnetic_field_dims_local'] + fileout['magnetic_x'][xs:xs+nxl_mag,ys:ys+nyl_mag,zs:zs+nzl_mag] = filein['magnetic_x'] + fileout['magnetic_y'][xs:xs+nxl_mag,ys:ys+nyl_mag,zs:zs+nzl_mag] = filein['magnetic_y'] + fileout['magnetic_z'][xs:xs+nxl_mag,ys:ys+nyl_mag,zs:zs+nzl_mag] = filein['magnetic_z'] + except KeyError: + print('No magnetic field data present'); + filein.close() fileout.close() From 75ff03a5b55cd4a057ff2e5c8e990b4a98fe5835 Mon Sep 17 00:00:00 2001 From: Bob Caddy Date: Tue, 10 Jan 2023 14:01:12 -0500 Subject: [PATCH 18/18] Remove support for averaging slow cells in MHD We're not entirely sure how to do this and since it probably isn't required we're removing support for now. 
Also, slightly refactored the MHD part of the timestep calculation to combine two #ifdef statements into one --- src/hydro/hydro_cuda.cu | 27 ++++----------------------- 1 file changed, 4 insertions(+), 23 deletions(-) diff --git a/src/hydro/hydro_cuda.cu b/src/hydro/hydro_cuda.cu index e6b110ffc..7ad6e994a 100644 --- a/src/hydro/hydro_cuda.cu +++ b/src/hydro/hydro_cuda.cu @@ -548,14 +548,12 @@ __global__ void Calc_dt_3D(Real *dev_conserved, Real *dev_dti, Real gamma, int n vy = dev_conserved[2*n_cells + id] * d_inv; vz = dev_conserved[3*n_cells + id] * d_inv; E = dev_conserved[4*n_cells + id]; + + // Compute the maximum inverse crossing time in the cell #ifdef MHD // Compute the cell centered magnetic field using a straight average of // the faces auto const [avgBx, avgBy, avgBz] = mhd::utils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny); - #endif //MHD - - // Compute the maximum inverse crossing time in the cell - #ifdef MHD max_dti = fmax(max_dti,mhdInverseCrossingTime(E, d, d_inv, vx, vy, vz, avgBx, avgBy, avgBz, dx, dy, dz, gamma)); #else // not MHD max_dti = fmax(max_dti,hydroInverseCrossingTime(E, d, d_inv, vx, vy, vz, dx, dy, dz, gamma)); @@ -646,17 +644,8 @@ __global__ void Average_Slow_Cells_3D(Real *dev_conserved, int nx, int ny, int n vz = dev_conserved[3*n_cells + id] * d_inv; E = dev_conserved[4*n_cells + id]; - #ifdef MHD - // Compute the cell centered magnetic field using a straight average of the faces - auto [avgBx, avgBy, avgBz] = mhdUtils::cellCenteredMagneticFields(dev_conserved, id, xid, yid, zid, n_cells, nx, ny); - #endif //MHD - // Compute the maximum inverse crossing time in the cell - #ifdef MHD - max_dti = mhdInverseCrossingTime(E, d, d_inv, vx, vy, vz, avgBx, avgBy, avgBz, dx, dy, dz, gamma); - #else // not MHD - max_dti = hydroInverseCrossingTime(E, d, d_inv, vx, vy, vz, dx, dy, dz, gamma); - #endif //MHD + max_dti = hydroInverseCrossingTime(E, d, d_inv, vx, vy, vz, dx, dy, dz, gamma); if (max_dti > 
max_dti_slow){ speed = sqrt(vx*vx + vy*vy + vz*vz); @@ -1185,15 +1174,7 @@ __device__ void Average_Cell_All_Fields( int i, int j, int k, int nx, int ny, in Average_Cell_Single_Field( 3, i, j, k, nx, ny, nz, ncells, conserved ); // Average Energy Average_Cell_Single_Field( 4, i, j, k, nx, ny, nz, ncells, conserved ); - #ifdef MHD - // Average MHD - Average_Cell_Single_Field( grid_enum::magnetic_x, i, j, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( grid_enum::magnetic_y, i, j, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( grid_enum::magnetic_z, i, j, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( grid_enum::magnetic_x, i-1, j, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( grid_enum::magnetic_y, i, j-1, k, nx, ny, nz, ncells, conserved ); - Average_Cell_Single_Field( grid_enum::magnetic_z, i, j, k-1, nx, ny, nz, ncells, conserved ); - #endif //MHD + #ifdef DE // Average GasEnergy Average_Cell_Single_Field( n_fields-1, i, j, k, nx, ny, nz, ncells, conserved );