From fa357c118dd2db162ce8288046c871f835b9b37f Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Tue, 19 Mar 2024 15:43:50 +0100
Subject: [PATCH 001/129] Add isFci to check if a field is a FCI field.

---
 include/bout/field.hxx | 5 +++++
 1 file changed, 5 insertions(+)
diff --git a/include/bout/field.hxx b/include/bout/field.hxx
index c0693ec0fb..c0ce04dbed 100644
--- a/include/bout/field.hxx
+++ b/include/bout/field.hxx
@@ -178,6 +178,11 @@ inline bool areFieldsCompatible(const Field& field1, const Field& field2) {
 #define ASSERT1_FIELDS_COMPATIBLE(field1, field2) ;
 #endif
 
+template <typename F>
+inline bool isFci(const F& f) {
+  return not f.getCoordinates()->getParallelTransform().canToFromFieldAligned();
+}
+
 /// Return an empty shell field of some type derived from Field, with metadata
 /// copied and a data array that is allocated but not initialised.
 template <typename T>

From ca59edb366be164e3583dc6041ea26d28c569ed8 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Fri, 3 Nov 2023 14:04:13 +0100
Subject: [PATCH 002/129] Improve isFci

Ensure isFci does not crash if the coordinates or the parallel transform
are not set. In that case no FCI transform can be in use, so it returns false.
---
 include/bout/field.hxx | 9 ++++++++-
 1 file changed, 8 insertions(+), 1 deletion(-)

diff --git a/include/bout/field.hxx b/include/bout/field.hxx
index c0ce04dbed..4433af6d19 100644
--- a/include/bout/field.hxx
+++ b/include/bout/field.hxx
@@ -180,7 +180,14 @@ inline bool areFieldsCompatible(const Field& field1, const Field& field2) {
 
 template <typename F>
 inline bool isFci(const F& f) {
-  return not f.getCoordinates()->getParallelTransform().canToFromFieldAligned();
+  const auto coords = f.getCoordinates();
+  if (coords == nullptr){
+    return false;
+  }
+  if (not coords->hasParallelTransform()) {
+    return false;
+  }
+  return not coords->getParallelTransform().canToFromFieldAligned();
 }
 
 /// Return an empty shell field of some type derived from Field, with metadata

From 8b1fbba650fbaa17c572c7036c4a3d949892cece Mon Sep 17 00:00:00 2001
From: dschwoerer <dschwoerer@users.noreply.github.com>
Date: Tue, 19 Mar 2024 15:27:28 +0000
Subject: [PATCH 003/129] Apply clang-format changes

---
 include/bout/field.hxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/include/bout/field.hxx b/include/bout/field.hxx
index 4433af6d19..61e4af4d4b 100644
--- a/include/bout/field.hxx
+++ b/include/bout/field.hxx
@@ -181,7 +181,7 @@ inline bool areFieldsCompatible(const Field& field1, const Field& field2) {
 template <typename F>
 inline bool isFci(const F& f) {
   const auto coords = f.getCoordinates();
-  if (coords == nullptr){
+  if (coords == nullptr) {
     return false;
   }
   if (not coords->hasParallelTransform()) {

From 23d309f2532376be77e653535e9e67f96915d20b Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Wed, 20 Mar 2024 10:28:57 +0100
Subject: [PATCH 004/129] Make isFci a member function and add hasParallelTransform

---
 include/bout/coordinates.hxx |  5 +++--
 include/bout/field.hxx       | 14 ++------------
 src/field/field.cxx          | 11 +++++++++++
 3 files changed, 16 insertions(+), 14 deletions(-)

diff --git a/include/bout/coordinates.hxx b/include/bout/coordinates.hxx
index 49feffa0a7..5ea2d276fc 100644
--- a/include/bout/coordinates.hxx
+++ b/include/bout/coordinates.hxx
@@ -133,9 +133,10 @@ public:
     transform = std::move(pt);
   }
 
+  bool hasParallelTransform() const { return transform != nullptr; }
   /// Return the parallel transform
-  ParallelTransform& getParallelTransform() {
-    ASSERT1(transform != nullptr);
+  ParallelTransform& getParallelTransform() const {
+    ASSERT1(hasParallelTransform());
     return *transform;
   }
 
diff --git a/include/bout/field.hxx b/include/bout/field.hxx
index 61e4af4d4b..d0828e8f6c 100644
--- a/include/bout/field.hxx
+++ b/include/bout/field.hxx
@@ -86,6 +86,8 @@ public:
 
   std::string name;
 
+  bool isFci() const;
+
 #if CHECK > 0
   // Routines to test guard/boundary cells set
 
@@ -178,18 +180,6 @@ inline bool areFieldsCompatible(const Field& field1, const Field& field2) {
 #define ASSERT1_FIELDS_COMPATIBLE(field1, field2) ;
 #endif
 
-template <typename F>
-inline bool isFci(const F& f) {
-  const auto coords = f.getCoordinates();
-  if (coords == nullptr) {
-    return false;
-  }
-  if (not coords->hasParallelTransform()) {
-    return false;
-  }
-  return not coords->getParallelTransform().canToFromFieldAligned();
-}
-
 /// Return an empty shell field of some type derived from Field, with metadata
 /// copied and a data array that is allocated but not initialised.
 template <typename T>
diff --git a/src/field/field.cxx b/src/field/field.cxx
index e48a8f3ef7..c9373454bf 100644
--- a/src/field/field.cxx
+++ b/src/field/field.cxx
@@ -39,3 +39,14 @@ int Field::getNx() const { return getMesh()->LocalNx; }
 int Field::getNy() const { return getMesh()->LocalNy; }
 
 int Field::getNz() const { return getMesh()->LocalNz; }
+
+bool Field::isFci() const {
+  const auto coords = this->getCoordinates();
+  if (coords == nullptr) {
+    return false;
+  }
+  if (not coords->hasParallelTransform()) {
+    return false;
+  }
+  return not coords->getParallelTransform().canToFromFieldAligned();
+}

From 18fca62f3367981fc173ba58297715e9e3f2c351 Mon Sep 17 00:00:00 2001
From: David Bold <dschwoerer@users.noreply.github.com>
Date: Fri, 12 Apr 2024 15:00:21 +0200
Subject: [PATCH 005/129] Make it explicit that this is a pointer

---
 src/field/field.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/field/field.cxx b/src/field/field.cxx
index c9373454bf..797df6c405 100644
--- a/src/field/field.cxx
+++ b/src/field/field.cxx
@@ -41,7 +41,7 @@ int Field::getNy() const { return getMesh()->LocalNy; }
 int Field::getNz() const { return getMesh()->LocalNz; }
 
 bool Field::isFci() const {
-  const auto coords = this->getCoordinates();
+  const auto* coords = this->getCoordinates();
   if (coords == nullptr) {
     return false;
   }

From 44084cca1fa150f760102aa10d97b4be714ed10e Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Tue, 2 Jul 2024 14:38:47 +0200
Subject: [PATCH 006/129] Add isFci also to mesh

---
 include/bout/mesh.hxx | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/include/bout/mesh.hxx b/include/bout/mesh.hxx
index c80716fc12..a3a36ad933 100644
--- a/include/bout/mesh.hxx
+++ b/include/bout/mesh.hxx
@@ -828,6 +828,17 @@ public:
     ASSERT1(RegionID.has_value());
     return region3D[RegionID.value()];
   }
+  bool isFci() const {
+    const auto coords = this->getCoordinatesConst();
+    if (coords == nullptr) {
+      return false;
+    }
+    if (not coords->hasParallelTransform()) {
+      return false;
+    }
+    return not coords->getParallelTransform().canToFromFieldAligned();
+  }
+
 
 private:
   /// Allocates default Coordinates objects

From cd288e98d1964d517380ce883fcb83da1106e3f0 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Fri, 9 Aug 2024 10:47:16 +0200
Subject: [PATCH 007/129] Add const version for getCoordinates

---
 include/bout/mesh.hxx | 13 +++++++++++++
 1 file changed, 13 insertions(+)

diff --git a/include/bout/mesh.hxx b/include/bout/mesh.hxx
index a3a36ad933..ccc979987b 100644
--- a/include/bout/mesh.hxx
+++ b/include/bout/mesh.hxx
@@ -636,6 +636,19 @@ public:
     return inserted.first->second;
   }
 
+  std::shared_ptr<Coordinates>
+  getCoordinatesConst(const CELL_LOC location = CELL_CENTRE) const {
+    ASSERT1(location != CELL_DEFAULT);
+    ASSERT1(location != CELL_VSHIFT);
+
+    auto found = coords_map.find(location);
+    if (found != coords_map.end()) {
+      // True branch most common, returns immediately
+      return found->second;
+    }
+    throw BoutException("Coordinates not yet set. Use non-const version!");
+  }
+
   /// Returns the non-CELL_CENTRE location
   /// allowed as a staggered location
   CELL_LOC getAllowedStaggerLoc(DIRECTION direction) const {

From 061b82ffbd14373f744ad205f6577c3c03120b3a Mon Sep 17 00:00:00 2001
From: dschwoerer <dschwoerer@users.noreply.github.com>
Date: Tue, 22 Oct 2024 10:04:02 +0000
Subject: [PATCH 008/129] Apply clang-format changes

---
 include/bout/mesh.hxx | 1 -
 1 file changed, 1 deletion(-)

diff --git a/include/bout/mesh.hxx b/include/bout/mesh.hxx
index ccc979987b..c1a6a1336d 100644
--- a/include/bout/mesh.hxx
+++ b/include/bout/mesh.hxx
@@ -852,7 +852,6 @@ public:
     return not coords->getParallelTransform().canToFromFieldAligned();
   }
 
-
 private:
   /// Allocates default Coordinates objects
   /// By default attempts to read staggered Coordinates from grid data source,

From ececfb831dff6ae17aff36924fe01e97c9eeb7d7 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Wed, 6 Nov 2024 16:46:26 +0100
Subject: [PATCH 009/129] Apply suggestions from clang-tidy

---
 include/bout/mesh.hxx | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/include/bout/mesh.hxx b/include/bout/mesh.hxx
index c1a6a1336d..ed9f6f8d60 100644
--- a/include/bout/mesh.hxx
+++ b/include/bout/mesh.hxx
@@ -651,7 +651,7 @@ public:
 
   /// Returns the non-CELL_CENTRE location
   /// allowed as a staggered location
-  CELL_LOC getAllowedStaggerLoc(DIRECTION direction) const {
+  static CELL_LOC getAllowedStaggerLoc(DIRECTION direction) {
     AUTO_TRACE();
     switch (direction) {
     case (DIRECTION::X):
@@ -860,8 +860,7 @@ private:
   /// (useful if CELL_CENTRE Coordinates have been changed, so reading from file
   /// would not be correct).
   std::shared_ptr<Coordinates>
-  createDefaultCoordinates(const CELL_LOC location,
-                           bool force_interpolate_from_centre = false);
+  createDefaultCoordinates(CELL_LOC location, bool force_interpolate_from_centre = false);
 
   //Internal region related information
   std::map<std::string, size_t> regionMap3D;

From aebca7ea5714c1e79297d81022325e59049799fb Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Mon, 10 Feb 2025 15:59:34 +0000
Subject: [PATCH 010/129] CI: Bump clang-tidy-review

---
 .github/workflows/clang-tidy-review.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/clang-tidy-review.yml b/.github/workflows/clang-tidy-review.yml
index 8ddcd4ae3f..834caa4d22 100644
--- a/.github/workflows/clang-tidy-review.yml
+++ b/.github/workflows/clang-tidy-review.yml
@@ -22,7 +22,7 @@ jobs:
           submodules: true
 
       - name: Run clang-tidy
-        uses: ZedThree/clang-tidy-review@v0.19.0
+        uses: ZedThree/clang-tidy-review@v0.20.1
         id: review
         with:
           annotations: true
@@ -48,4 +48,4 @@ jobs:
                              -DBOUT_UPDATE_GIT_SUBMODULE=OFF
 
       - name: Upload clang-tidy fixes
-        uses: ZedThree/clang-tidy-review/upload@v0.19.0
+        uses: ZedThree/clang-tidy-review/upload@v0.20.1

From cc8c683a97a098aeb8875d4519ec3b5881e3b495 Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Mon, 10 Feb 2025 17:28:10 +0000
Subject: [PATCH 011/129] CI: Disable annotations for clang-tidy-review

---
 .github/workflows/clang-tidy-review.yml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/.github/workflows/clang-tidy-review.yml b/.github/workflows/clang-tidy-review.yml
index 834caa4d22..1e2f88d208 100644
--- a/.github/workflows/clang-tidy-review.yml
+++ b/.github/workflows/clang-tidy-review.yml
@@ -25,7 +25,6 @@ jobs:
         uses: ZedThree/clang-tidy-review@v0.20.1
         id: review
         with:
-          annotations: true
           build_dir: build
           apt_packages: "libfftw3-dev,libnetcdf-c++4-dev,libopenmpi-dev,petsc-dev,slepc-dev,liblapack-dev,libparpack2-dev,libsundials-dev,uuid-dev"
           config_file: ".clang-tidy"

From 9063bf16186d29fbc73a2cb3fd0f1b8e8af7ce7c Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Tue, 11 Feb 2025 09:47:23 +0100
Subject: [PATCH 012/129] CI: Show more output of dnf5 to help debugging

---
 .ci_fedora.sh | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.ci_fedora.sh b/.ci_fedora.sh
index 77e7f45055..359516ab33 100755
--- a/.ci_fedora.sh
+++ b/.ci_fedora.sh
@@ -41,6 +41,7 @@ then
     # Ignore weak depencies
     echo "install_weak_deps=False" >> /etc/dnf/dnf.conf
     echo "minrate=10M" >> /etc/dnf/dnf.conf
+    export FORCE_COLUMNS=200
     time dnf -y install dnf5
     time dnf5 -y install dnf5-plugins cmake python3-zoidberg python3-natsort
     # Allow to override packages - see #2073

From d377379e7d5af7373411fb2650d8759f586cd012 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Tue, 4 Mar 2025 17:04:21 -0800
Subject: [PATCH 013/129] elm-pb example: Adding relaxing phi boundaries

Adds an option phi_boundary_relax. If set to true, then the radial
boundary conditions on the potential phi are relaxed over a given
timescale towards zero gradient.

Adapted from Hermes-3
(https://github.com/boutproject/hermes-3/blob/master/src/vorticity.cxx#L261).
---
 examples/elm-pb/elm_pb.cxx        | 310 ++++++++++++++++++++++++++----
 examples/elm-pb/relaxing/BOUT.inp | 299 ++++++++++++++++++++++++++++
 2 files changed, 573 insertions(+), 36 deletions(-)
 create mode 100644 examples/elm-pb/relaxing/BOUT.inp

diff --git a/examples/elm-pb/elm_pb.cxx b/examples/elm-pb/elm_pb.cxx
index f830f3d98a..4c34dee0ad 100644
--- a/examples/elm-pb/elm_pb.cxx
+++ b/examples/elm-pb/elm_pb.cxx
@@ -17,6 +17,9 @@
 #include <bout/sourcex.hxx>
 #include <bout/utils.hxx>
 
+#include <bout/difops.hxx>
+#include <bout/fv_ops.hxx>
+
 #include <math.h>
 
 #if BOUT_HAS_HYPRE
@@ -46,6 +49,7 @@ class ELMpb : public PhysicsModel {
   Coordinates::FieldMetric U0; // 0th vorticity of equilibrium flow,
   // radial flux coordinate, normalized radial flux coordinate
 
+  bool laplace_perp; // Use Laplace_perp or Delp2?
   bool constn0;
   // the total height, average width and center of profile of N0
   BoutReal n0_height, n0_ave, n0_width, n0_center, n0_bottom_x, Nbar, Tibar, Tebar;
@@ -203,7 +207,11 @@ class ELMpb : public PhysicsModel {
 
   bool parallel_lr_diff; // Use left and right shifted stencils for parallel differences
 
-  bool phi_constraint; // Solver for phi using a solver constraint
+  bool phi_constraint;               // Solver for phi using a solver constraint
+  bool phi_boundary_relax;           // Relax x boundaries of phi towards Neumann?
+  bool phi_core_averagey;            // Average phi core boundary in Y?
+  BoutReal phi_boundary_timescale;   // Relaxation timescale
+  BoutReal phi_boundary_last_update; // Time when last updated
 
   bool include_rmp; // Include RMP coil perturbation
   bool simple_rmp;  // Just use a simple form for the perturbation
@@ -350,7 +358,8 @@ class ELMpb : public PhysicsModel {
     //////////////////////////////////////////////////////////////
     auto& globalOptions = Options::root();
     auto& options = globalOptions["highbeta"];
-
+    laplace_perp = options["laplace_perp"].withDefault(false);
+    // Use Laplace_perp rather than Delp2
     constn0 = options["constn0"].withDefault(true);
     // use the hyperbolic profile of n0. If both  n0_fake_prof and
     // T0_fake_prof are false, use the profiles from grid file
@@ -377,6 +386,9 @@ class ELMpb : public PhysicsModel {
     phi_constraint = options["phi_constraint"]
                          .doc("Use solver constraint for phi?")
                          .withDefault(false);
+    phi_boundary_relax = options["phi_boundary_relax"]
+                             .doc("Relax x boundaries of phi towards Neumann?")
+                             .withDefault<bool>(false);
 
     // Effects to include/exclude
     include_curvature = options["include_curvature"].withDefault(true);
@@ -1148,6 +1160,24 @@ class ELMpb : public PhysicsModel {
 
     aparSolver = Laplacian::create(&globalOptions["aparSolver"], loc);
 
+    if (phi_boundary_relax) {
+      // Set the last update time to -1, so it will reset
+      // the first time RHS function is called
+      phi_boundary_last_update = -1.;
+      phi_core_averagey = options["phi_core_averagey"]
+                              .doc("Average phi core boundary in Y?")
+                              .withDefault<bool>(false)
+                          and mesh->periodicY(mesh->xstart);
+
+      phi_boundary_timescale = options["phi_boundary_timescale"]
+                                   .doc("Timescale for phi boundary relaxation [seconds]")
+                                   .withDefault(1e-7)
+                               / Tbar; // Normalise time units to Tbar
+
+      phiSolver->setInnerBoundaryFlags(INVERT_SET);
+      phiSolver->setOuterBoundaryFlags(INVERT_SET);
+    }
+
     /////////////// CHECK VACUUM ///////////////////////
     // In vacuum region, initial vorticity should equal zero
 
@@ -1315,10 +1345,124 @@ class ELMpb : public PhysicsModel {
       Ctmp.applyBoundary();
       Ctmp -= phi; // Now contains error in the boundary
 
-      C_phi = Delp2(phi) - U; // Error in the bulk
+      if (laplace_perp) {
+        C_phi = Laplace_perp(phi) - U; // Error in the bulk
+      } else {
+        C_phi = Delp2(phi) - U; // Error in the bulk
+      }
       C_phi.setBoundaryTo(Ctmp);
 
     } else {
+      if (phi_boundary_relax) {
+        // Update the boundary regions by relaxing towards zero gradient
+        // on a given timescale.
+
+        if (phi_boundary_last_update < 0.0) {
+          // First time this has been called.
+          phi_boundary_last_update = t;
+        } else if (t > phi_boundary_last_update) {
+          // Only update if simulation time has advanced
+          // Uses an exponential decay of the weighting of the value in the boundary
+          // so that the solution is well behaved for arbitrary steps
+          BoutReal weight = exp(-(t - phi_boundary_last_update) / phi_boundary_timescale);
+          phi_boundary_last_update = t;
+
+          if (mesh->firstX()) {
+            BoutReal phivalue = 0.0;
+            if (phi_core_averagey) {
+              // Single boundary value: mean of phi over Z and all non-guard Y points
+              BoutReal philocal = 0.0;
+              for (int j = mesh->ystart; j <= mesh->yend; j++) {
+                for (int k = 0; k < mesh->LocalNz; k++) {
+                  philocal += phi(mesh->xstart, j, k);
+                }
+              }
+              MPI_Comm comm_inner = mesh->getYcomm(0);
+              int np; // Number of processors sharing this X index in Y
+              MPI_Comm_size(comm_inner, &np);
+              MPI_Allreduce(&philocal, &phivalue, 1, MPI_DOUBLE, MPI_SUM, comm_inner);
+              phivalue /= (np * mesh->LocalNz * (mesh->yend - mesh->ystart + 1));
+            }
+            for (int j = mesh->ystart; j <= mesh->yend; j++) {
+              if (!phi_core_averagey) {
+                phivalue = 0.0; // Calculate phi boundary for each Y index separately
+                for (int k = 0; k < mesh->LocalNz; k++) {
+                  phivalue += phi(mesh->xstart, j, k);
+                }
+                phivalue /= mesh->LocalNz; // Average in Z of point next to boundary
+              }
+
+              // Old value of phi at boundary. Note: this is constant in Z
+              BoutReal oldvalue =
+                  0.5 * (phi(mesh->xstart - 1, j, 0) + phi(mesh->xstart, j, 0));
+
+              // New value of phi at boundary, relaxing towards phivalue
+              BoutReal newvalue = weight * oldvalue + (1. - weight) * phivalue;
+
+              // Set phi at the boundary to this value
+              for (int k = 0; k < mesh->LocalNz; k++) {
+                phi(mesh->xstart - 1, j, k) = 2. * newvalue - phi(mesh->xstart, j, k);
+                phi(mesh->xstart - 2, j, k) = phi(mesh->xstart - 1, j, k);
+              }
+            }
+          }
+
+          if (mesh->lastX()) {
+            for (int j = mesh->ystart; j <= mesh->yend; j++) {
+              BoutReal phivalue = 0.0;
+              for (int k = 0; k < mesh->LocalNz; k++) {
+                phivalue += phi(mesh->xend, j, k);
+              }
+              phivalue /= mesh->LocalNz; // Average in Z of point next to boundary
+              // Old value of phi at boundary. Note: this is constant in Z
+              BoutReal oldvalue =
+                  0.5 * (phi(mesh->xend + 1, j, 0) + phi(mesh->xend, j, 0));
+              // New value of phi at boundary, relaxing towards phivalue
+              BoutReal newvalue = weight * oldvalue + (1. - weight) * phivalue;
+              // Set the guard cells so the cell-face value equals newvalue
+              for (int k = 0; k < mesh->LocalNz; k++) {
+                phi(mesh->xend + 1, j, k) = 2. * newvalue - phi(mesh->xend, j, k);
+                phi(mesh->xend + 2, j, k) = phi(mesh->xend + 1, j, k);
+              }
+            }
+          }
+        }
+      }
+
+      Field3D phi_shift = phi;
+      if (constn0 and diamag) {
+        // Solving for phi + ion pressure term
+        phi_shift += 0.5 * dnorm * P / B0;
+      } else {
+        // Ensure that memory is not shared between phi and phi_shift
+        phi_shift.allocate();
+      }
+
+      // Update boundary conditions.
+      //  The INVERT_SET flag takes the value in the guard (boundary) cell
+      //    and sets the boundary between cells to this value.
+      //    This shift by 1/2 grid cell is important.
+
+      if (mesh->firstX()) {
+        for (int j = mesh->ystart; j <= mesh->yend; j++) {
+          for (int k = 0; k < mesh->LocalNz; k++) {
+            // Average phi + Pi at the boundary, and set the boundary cell
+            // to this value. The phi solver will then put the value back
+            // onto the cell mid-point
+            phi_shift(mesh->xstart - 1, j, k) =
+                0.5 * (phi_shift(mesh->xstart - 1, j, k) + phi_shift(mesh->xstart, j, k));
+          }
+        }
+      }
+
+      if (mesh->lastX()) {
+        for (int j = mesh->ystart; j <= mesh->yend; j++) {
+          for (int k = 0; k < mesh->LocalNz; k++) {
+            phi_shift(mesh->xend + 1, j, k) =
+                0.5 * (phi_shift(mesh->xend + 1, j, k) + phi_shift(mesh->xend, j, k));
+          }
+        }
+      }
 
       if (constn0) {
         if (split_n0) {
@@ -1326,44 +1470,84 @@ class ELMpb : public PhysicsModel {
           // Boussinesq, split
           // Split into axisymmetric and non-axisymmetric components
           Field2D Vort2D = DC(U); // n=0 component
+          Field2D phi_shift_2d = phi2D;
+
+          if (phi_boundary_relax) {
+            phi_shift_2d = DC(phi_shift);
+          }
+          phi_shift -= phi_shift_2d;
 
           // Applies boundary condition for "phi".
           phi2D.applyBoundary(t);
 
           // Solve axisymmetric (n=0) part
-          phi2D = laplacexy->solve(Vort2D, phi2D);
+          phi2D = laplacexy->solve(Vort2D, phi_shift_2d);
 
           // Solve non-axisymmetric part
-          phi = phiSolver->solve(U - Vort2D);
+          phi = phiSolver->solve(U - Vort2D, phi_shift);
 
           phi += phi2D; // Add axisymmetric part
         } else {
-          phi = phiSolver->solve(U);
+          if (phi_boundary_relax) {
+            phi = phiSolver->solve(U, phi_shift);
+          } else {
+            phi = phiSolver->solve(U);
+          }
         }
-
         if (diamag) {
           phi -= 0.5 * dnorm * P / B0;
         }
       } else {
         ubyn = U / N0;
         if (diamag) {
-          ubyn -= 0.5 * dnorm / (N0 * B0) * Delp2(P);
+          if (laplace_perp) {
+            ubyn -= 0.5 * dnorm / (N0 * B0) * Laplace_perp(P);
+          } else {
+            ubyn -= 0.5 * dnorm / (N0 * B0) * Delp2(P);
+          }
           mesh->communicate(ubyn);
         }
         // Invert laplacian for phi
         phiSolver->setCoefC(N0);
         phi = phiSolver->solve(ubyn);
       }
-      // Apply a boundary condition on phi for target plates
-      phi.applyBoundary();
       mesh->communicate(phi);
     }
 
+    if (mesh->firstX()) {
+      for (int i = mesh->xstart - 2; i >= 0; --i) {
+        for (int j = mesh->ystart; j <= mesh->yend; ++j) {
+          for (int k = 0; k < mesh->LocalNz; ++k) {
+            phi(i, j, k) = phi(i + 1, j, k);
+          }
+        }
+      }
+    }
+
+    if (mesh->lastX()) {
+      for (int i = mesh->xend + 2; i < mesh->LocalNx; ++i) {
+        for (int j = mesh->ystart; j <= mesh->yend; ++j) {
+          for (int k = 0; k < mesh->LocalNz; ++k) {
+            phi(i, j, k) = phi(i - 1, j, k);
+          }
+        }
+      }
+    }
+
     if (!evolve_jpar) {
       // Get J from Psi
-      Jpar = Delp2(Psi);
+      if (laplace_perp) {
+        Jpar = Laplace_perp(Psi);
+      } else {
+        Jpar = Delp2(Psi);
+      }
+
       if (include_rmp) {
-        Jpar += Delp2(rmp_Psi);
+        if (laplace_perp) {
+          Jpar += Laplace_perp(rmp_Psi);
+        } else {
+          Jpar += Delp2(rmp_Psi);
+        }
       }
 
       Jpar.applyBoundary();
@@ -1397,8 +1581,11 @@ class ELMpb : public PhysicsModel {
       }
 
       // Get Delp2(J) from J
-      Jpar2 = Delp2(Jpar);
-
+      if (laplace_perp) {
+        Jpar2 = Laplace_perp(Jpar);
+      } else {
+        Jpar2 = Delp2(Jpar);
+      }
       Jpar2.applyBoundary();
       mesh->communicate(Jpar2);
 
@@ -1494,7 +1681,11 @@ class ELMpb : public PhysicsModel {
       // Jpar
       Field3D B0U = B0 * U;
       mesh->communicate(B0U);
-      ddt(Jpar) = -Grad_parP(B0U, loc) / B0 + eta * Delp2(Jpar);
+      if (laplace_perp) {
+        ddt(Jpar) = -Grad_parP(B0U, loc) / B0 + eta * Laplace_perp(Jpar);
+      } else {
+        ddt(Jpar) = -Grad_parP(B0U, loc) / B0 + eta * Delp2(Jpar);
+      }
 
       if (relax_j_vac) {
         // Make ddt(Jpar) relax to zero.
@@ -1524,11 +1715,19 @@ class ELMpb : public PhysicsModel {
       }
 
       if (hyperresist > 0.0) { // Hyper-resistivity
-        ddt(Psi) -= eta * hyperresist * Delp2(Jpar);
+        if (laplace_perp) {
+          ddt(Psi) -= eta * hyperresist * Laplace_perp(Jpar);
+        } else {
+          ddt(Psi) -= eta * hyperresist * Delp2(Jpar);
+        }
       }
 
       if (ehyperviscos > 0.0) { // electron Hyper-viscosity coefficient
-        ddt(Psi) -= eta * ehyperviscos * Delp2(Jpar2);
+        if (laplace_perp) {
+          ddt(Psi) -= eta * ehyperviscos * Laplace_perp(Jpar2);
+        } else {
+          ddt(Psi) -= eta * ehyperviscos * Delp2(Jpar2);
+        }
       }
 
       // Parallel hyper-viscous diffusion for vector potential
@@ -1599,7 +1798,11 @@ class ELMpb : public PhysicsModel {
     }
 
     if (viscos_perp > 0.0) {
-      ddt(U) += viscos_perp * Delp2(U); // Perpendicular viscosity
+      if (laplace_perp) {
+        ddt(U) += viscos_perp * Laplace_perp(U); // Perpendicular viscosity
+      } else {
+        ddt(U) += viscos_perp * Delp2(U); // Perpendicular viscosity
+      }
     }
 
     // Hyper-viscosity
@@ -1626,21 +1829,39 @@ class ELMpb : public PhysicsModel {
       Pi = 0.5 * P;
       Pi0 = 0.5 * P0;
 
-      Dperp2Phi0 = Field3D(Delp2(B0 * phi0));
-      Dperp2Phi0.applyBoundary();
-      mesh->communicate(Dperp2Phi0);
+      if (laplace_perp) {
+        Dperp2Phi0 = Field3D(Laplace_perp(B0 * phi0));
+        Dperp2Phi0.applyBoundary();
+        mesh->communicate(Dperp2Phi0);
+
+        Dperp2Phi = Laplace_perp(B0 * phi);
+        Dperp2Phi.applyBoundary();
+        mesh->communicate(Dperp2Phi);
+
+        Dperp2Pi0 = Field3D(Laplace_perp(Pi0));
+        Dperp2Pi0.applyBoundary();
+        mesh->communicate(Dperp2Pi0);
+
+        Dperp2Pi = Laplace_perp(Pi);
+        Dperp2Pi.applyBoundary();
+        mesh->communicate(Dperp2Pi);
+      } else {
+        Dperp2Phi0 = Field3D(Delp2(B0 * phi0));
+        Dperp2Phi0.applyBoundary();
+        mesh->communicate(Dperp2Phi0);
 
-      Dperp2Phi = Delp2(B0 * phi);
-      Dperp2Phi.applyBoundary();
-      mesh->communicate(Dperp2Phi);
+        Dperp2Phi = Delp2(B0 * phi);
+        Dperp2Phi.applyBoundary();
+        mesh->communicate(Dperp2Phi);
 
-      Dperp2Pi0 = Field3D(Delp2(Pi0));
-      Dperp2Pi0.applyBoundary();
-      mesh->communicate(Dperp2Pi0);
+        Dperp2Pi0 = Field3D(Delp2(Pi0));
+        Dperp2Pi0.applyBoundary();
+        mesh->communicate(Dperp2Pi0);
 
-      Dperp2Pi = Delp2(Pi);
-      Dperp2Pi.applyBoundary();
-      mesh->communicate(Dperp2Pi);
+        Dperp2Pi = Delp2(Pi);
+        Dperp2Pi.applyBoundary();
+        mesh->communicate(Dperp2Pi);
+      }
 
       bracketPhi0P = bracket(B0 * phi0, Pi, bm_exb);
       bracketPhi0P.applyBoundary();
@@ -1658,8 +1879,13 @@ class ELMpb : public PhysicsModel {
       mesh->communicate(B0phi0);
       ddt(U) += 0.5 * Upara2 * bracket(B0phi, Dperp2Pi0, bm_exb) / B0;
       ddt(U) += 0.5 * Upara2 * bracket(B0phi0, Dperp2Pi, bm_exb) / B0;
-      ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhi0P) / B0;
-      ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhiP0) / B0;
+      if (laplace_perp) {
+        ddt(U) -= 0.5 * Upara2 * Laplace_perp(bracketPhi0P) / B0;
+        ddt(U) -= 0.5 * Upara2 * Laplace_perp(bracketPhiP0) / B0;
+      } else {
+        ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhi0P) / B0;
+        ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhiP0) / B0;
+      }
 
       if (nonlinear) {
         Field3D B0phi = B0 * phi;
@@ -1670,7 +1896,11 @@ class ELMpb : public PhysicsModel {
 
         ddt(U) -= 0.5 * Upara2 * bracket(Pi, Dperp2Phi, bm_exb) / B0;
         ddt(U) += 0.5 * Upara2 * bracket(B0phi, Dperp2Pi, bm_exb) / B0;
-        ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhiP) / B0;
+        if (laplace_perp) {
+          ddt(U) -= 0.5 * Upara2 * Laplace_perp(bracketPhiP) / B0;
+        } else {
+          ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhiP) / B0;
+        }
       }
     }
 
@@ -1808,7 +2038,12 @@ class ELMpb : public PhysicsModel {
   int precon(BoutReal UNUSED(t), BoutReal gamma, BoutReal UNUSED(delta)) {
     // First matrix, applying L
     mesh->communicate(ddt(Psi));
-    Field3D Jrhs = Delp2(ddt(Psi));
+    Field3D Jrhs;
+    if (laplace_perp) {
+      Jrhs = Laplace_perp(ddt(Psi));
+    } else {
+      Jrhs = Delp2(ddt(Psi));
+    }
     Jrhs.applyBoundary("neumann");
 
     if (jpar_bndry_width > 0) {
@@ -1880,8 +2115,11 @@ class ELMpb : public PhysicsModel {
 
     phi = phiSolver->solve(ddt(U));
 
-    Jpar = Delp2(ddt(Psi));
-
+    if (laplace_perp) {
+      Jpar = Laplace_perp(ddt(Psi));
+    } else {
+      Jpar = Delp2(ddt(Psi));
+    }
     mesh->communicate(phi, Jpar);
 
     Field3D JP = -b0xGrad_dot_Grad(phi, P0);
diff --git a/examples/elm-pb/relaxing/BOUT.inp b/examples/elm-pb/relaxing/BOUT.inp
new file mode 100644
index 0000000000..d9489611e6
--- /dev/null
+++ b/examples/elm-pb/relaxing/BOUT.inp
@@ -0,0 +1,299 @@
+# settings file for BOUT++
+# High-Beta reduced MHD case
+
+##################################################
+# Global settings used by the core code
+
+nout = 1000         # number of time-steps
+timestep = 1       # time between outputs
+
+zperiod = 5        # Fraction of a torus to simulate
+MZ = 64             # Number of points in Z
+
+grid = "cbm18_dens8.grid_nx68ny64.nc" #"cbm18_dens3_0.5BS_516nx64ny.grid.nc"
+
+[mesh]
+
+staggergrids = false    # Use staggered grids
+
+[mesh:paralleltransform]
+#type = shifted # Use shifted metric method
+type = shiftedinterp
+
+##################################################
+# derivative methods
+
+[mesh:ddx]
+first = C4  # order of first x derivatives
+second = C4 # order of second x derivatives
+upwind = W3 # order of upwinding method W3 = Weno3
+
+[mesh:ddy]
+first = C4
+second = C4
+upwind = W3
+flux = C2
+
+[mesh:ddz]
+first = C4  # Z derivatives can be done using FFT
+second = C4
+upwind = W3
+
+##################################################
+# FFTs
+
+[fft]
+
+fft_measurement_flag = measure  # If using FFTW, perform tests to determine fastest method
+
+[output]
+
+#type = adios
+#shiftoutput = true  # Put the output into field-aligned coordinates
+
+[restart_files]
+
+#type = adios
+
+[laplace]
+
+#type = hypre3d
+#rtol = 1.e-9
+#atol = 1.e-14
+#pctype = sor    # Preconditioner
+
+#atol = 1e-12
+#rtol = 1e-08
+
+
+##################################################
+# Solver settings
+
+[solver]
+
+# mudq, mldq, mukeep, mlkeep preconditioner options
+atol = 1.0e-8 # absolute tolerance
+rtol = 1.0e-5  # relative tolerance
+
+use_precon = false    # Use preconditioner: User-supplied or BBD
+
+mxstep = 50000   # Number of internal steps between outputs
+
+##################################################
+# settings for high-beta reduced MHD
+
+[highbeta]
+
+density = 1.0e19       # number density of deuterium [m^-3]
+                       # used to produce output normalisations
+constn0 = true
+n0_fake_prof = false
+
+sheath_boundaries = false
+
+evolve_jpar = false     # If true, evolve J rather than Psi
+
+evolve_pressure = true # If false, switch off all pressure evolution
+
+phi_constraint = false # Solve phi as a constraint (DAE system, needs IDA)
+
+## Effects to include/exclude
+
+include_jpar0 = true     # determines whether to include jpar0 terms
+include_curvature = true # include curvature drive term?
+
+compress = false       # set compressible (evolve Vpar)
+nonlinear = true       # include non-linear terms?
+
+diamag = true         # Include diamagnetic effects?
+diamag_grad_t = false  # Include Grad_par(Te) term in Psi equation
+diamag_phi0 = true    # Balance ExB against Vd for stationary equilibrium
+
+split_n0 = false
+
+laplace_perp = true
+
+##################################################
+# BRACKET_METHOD flags:
+# 0:BRACKET_STD; derivative methods will be determined
+#   by the choices C or W in this input file
+# 1:BRACKET_SIMPLE; 2:BRACKET_ARAKAWA; 3:BRACKET_CTU.
+
+bm_exb_flag = 0
+bm_mag_flag = 0
+##################################################################
+withflow = false     # With flow or not
+D_0 = 130000        # differential potential
+D_s = 20            # shear parameter
+K_H_term = false    # Contain K-H term
+sign = -1           # flow direction
+x0 = 0.855          # peak location
+D_min = 3000        # constant
+##################################################################
+
+eHall = false         # Include electron pressure effects in Ohm's law?
+AA = 2.0          # ion mass in units of proton mass
+Zeff = 1.0
+#Zi = 1.0
+
+noshear = false        # zero all shear
+
+relax_j_vac = false    # Relax to zero-current in the vacuum
+relax_j_tconst = 1e-2  # Time constant for vacuum relaxation
+
+## Toroidal filtering
+filter_z = false   # remove all except one mode
+filter_z_mode = 1  # Specify which harmonic to keep (1 = fundamental)
+low_pass_z = 16    # Keep up to and including this harmonic (-1 = keep all)
+zonal_flow = true    # keep zonal component of vorticity?
+zonal_field = false  # keep zonal component of Psi?
+zonal_bkgd = true    # keep zonal component of P?
+
+## Jpar smoothing
+smooth_j_x = true  # Filter Jpar in the X direction
+
+## Magnetic perturbations
+include_rmp = false # Read RMP data from grid file
+
+simple_rmp = false  # Enable/disable a simple model of RMP
+rmp_n = 3           # Toroidal mode number
+rmp_m = 6           # Poloidal mode number
+rmp_factor = 1.e-4  # Amplitude of Apar [Tm]
+rmp_ramp = 1.e-4    # Timescale [s] of ramp
+rmp_polwid = -1.0   # Width of Gaussian factor (< 0 = No Gaussian)
+rmp_polpeak = 0.5   # Y location of maximum (fraction)
+
+## Vacuum region control
+
+vacuum_pressure = 0.02 # the pressure below which it is considered vacuum
+                       # fraction of peak pressure
+vacuum_trans = 0.01   # transition width (fraction of P)
+
+## Resistivity and Hyper-resistivity
+
+vac_lund = 1.0e8    # Lundquist number in vacuum  (negative -> infinity)
+core_lund = 1.0e8  # Lundquist number in core (negative -> infinity)
+hyperresist = 1.e-4 # Hyper-resistivity coefficient (like 1 / Lundquist number)
+
+## Inner boundary damping
+
+damp_width = -1       # Width of damping region (grid cells)
+damp_t_const = 1e-2  # Damping time constant
+
+## Parallel pressure diffusion
+
+diffusion_par = 1.0e-2     # Parallel pressure diffusion (< 0 = none)
+diffusion_p4 = -1e-05   # parallel hyper-viscous diffusion for pressure (< 0 = none)
+diffusion_u4 = -1e-05    # parallel hyper-viscous diffusion for vorticity (< 0 = none)
+diffusion_a4 = -1e-05   # parallel hyper-viscous diffusion for vector potential (< 0 = none)
+
+## heat source in pressure in watts
+
+heating_P = -1   #   heat power in watts (< 0 = none)
+hp_width = 0.1     #   heat width, in percentage of nx (< 0 = none)
+hp_length = 0.3    #   heat length in percentage of nx (< 0 = none)
+
+## sink rate in pressure
+
+sink_P = -1   #   sink rate in pressure (< 0 = none)
+sp_width = 0.04     #   sink width, in percentage of nx (< 0 = none)
+sp_length = 0.15    #   sink length in percentage of nx (< 0 = none)
+
+
+## left edge sink rate in vorticity
+sink_Ul = 10.0        #   left edge sink rate in vorticity (< 0 = none)
+su_widthl = 0.06     #   left edge sink width, in percentage of nx (< 0 = none)
+su_lengthl = 0.1     #   left edge sink length in percentage of nx (< 0 = none)
+
+## right edge sink rate in vorticity
+sink_Ur = 10.0        #   right edge sink rate in vorticity (< 0 = none)
+su_widthr = 0.06     #   right edge sink width, in percentage of nx (< 0 = none)
+su_lengthr = 0.1     #   right edge sink length in percentage of nx (< 0 = none)
+
+## Viscosity and Hyper-viscosity
+
+viscos_par = 0.1   # Parallel viscosity (< 0 = none)
+viscos_perp = 1.0e-7  # Perpendicular viscosity (< 0 = none)
+hyperviscos = -1.0  # Radial hyper viscosity
+
+## Compressional terms (only when compress = true)
+phi_curv = true    # Include curvature*Grad(phi) in P equation
+# gamma = 1.6666
+
+phi_boundary_relax = true # Relax phi at radial boundaries towards zero gradient
+phi_core_averagey = false
+phi_boundary_timescale = 1.0e-6 # In seconds
+
+[phiSolver]
+# INVERT_DC_GRAD = 1  // Zero-gradient for DC (constant in Z) component. Default is zero value
+# INVERT_AC_GRAD = 2  // Zero-gradient for AC (non-constant in Z) component. Default is zero value
+# INVERT_AC_LAP = 4   // Use zero-laplacian (decaying solution) to AC component
+# INVERT_DC_LAP = 64  // Use zero-laplacian solution for DC component
+#type = hypre3d
+#rtol = 1.e-9
+#atol = 1.e-14
+#inner_boundary_flags = 0 # 0 for Dirichlet; 2 for Neumann
+#outer_boundary_flags = 0 # 0 for Dirichlet; 2 for Neumann
+#hypre_print_level = 1  # print information on the matrices, solver settings, and iterations.
+
+[aparSolver]
+#type = hypre3d
+#rtol = 1.e-9
+#atol = 1.e-14
+#inner_boundary_flags = 4 # INVERT_AC_LAP
+#outer_boundary_flags = 1 + 4 # INVERT_DC_GRAD + INVERT_AC_LAP
+
+##################################################
+# settings for individual variables
+# The section "All" defines default settings for all variables
+# These can be overridden for individual variables in
+# a section of that name.
+
+[all]
+scale = 0.0 # default size of initial perturbations
+
+# boundary conditions
+# -------------------
+# dirichlet    - Zero value
+# neumann      - Zero gradient
+# zerolaplace  - Laplacian = 0, decaying solution
+# constlaplace - Laplacian = const, decaying solution
+#
+# relax( )   - Make boundary condition relaxing
+
+bndry_all = dirichlet_o2 # Default to zero-value
+
+[U]   # vorticity
+scale = 1e-05
+function = ballooning(gauss(x-0.5,0.1)*gauss(y-pi,0.6*pi)*sin(z),3)
+
+[P]  # pressure
+bndry_core = dirichlet
+#scale = 1.0e-5
+
+[Psi]  # Vector potential
+
+# zero laplacian
+bndry_xin = zerolaplace
+bndry_xout = zerolaplace
+
+[Psi_loc] # for staggering
+
+bndry_xin = zerolaplace
+bndry_xout = zerolaplace
+
+bndry_yup = free_o3
+bndry_ydown = free_o3
+
+[J]    # parallel current
+
+# Zero gradient in the core
+bndry_core = neumann
+
+[phi]
+
+#bndry_core = neumann
+bndry_xin = none
+bndry_xout = none
+#bndry_target = neumann
+

From 5ce6cae6ea94a76417a4c058fdd848db384d36d1 Mon Sep 17 00:00:00 2001
From: Rob Falgout <rfalgout@llnl.gov>
Date: Tue, 4 Mar 2025 17:04:44 -0800
Subject: [PATCH 014/129] First version of code to eliminate boundary equations
 to improve HYPRE solves

---
 include/bout/hypre_interface.hxx              | 193 +++++++++++++-
 .../laplace/impls/hypre3d/hypre3d_laplace.cxx |   6 +
 .../laplace/impls/hypre3d/hypre_boundary.c    | 252 ++++++++++++++++++
 3 files changed, 450 insertions(+), 1 deletion(-)
 create mode 100644 src/invert/laplace/impls/hypre3d/hypre_boundary.c

diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index ae392de4f3..72eec916e2 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -20,6 +20,56 @@
 #include "HYPRE_utilities.h"
 #include "_hypre_utilities.h"
 
+HYPRE_Int
+AdjustBCMatrixEquations(
+   HYPRE_Int       nrows,
+   HYPRE_Int      *ncols,
+   HYPRE_BigInt   *rows,
+   HYPRE_Int     **row_indexes_ptr,
+   HYPRE_BigInt   *cols,
+   HYPRE_Complex  *values,
+   HYPRE_Int       nb,              // number of boundary equations
+   HYPRE_Int      *bi_array,        // row i for each boundary equation
+   HYPRE_Int     **binum_array_ptr, // data index for row i (for each boundary equation)
+   HYPRE_Int     **bjnum_array_ptr, // data index for col j (for each boundary equation)
+   HYPRE_Complex **bii_array_ptr,   // coefficient b_ii (for each boundary equation)
+   HYPRE_Complex **bij_array_ptr,   // coefficient b_ij (for each boundary equation)
+   HYPRE_Int      *na_ptr,          // number of interior equations to adjust
+   HYPRE_Int     **aknum_array_ptr, // data index for row k (for each interior equation)
+   HYPRE_Complex **aki_array_ptr);  // coefficient a_ki (for each interior equation)
+
+HYPRE_Int
+AdjustBCRightHandSideEquations(
+   HYPRE_Complex  *rhs,
+   HYPRE_Int       nb,
+   HYPRE_Int      *binum_array,
+   HYPRE_Complex  *bii_array,
+   HYPRE_Complex  *bij_array,
+   HYPRE_Complex **brhs_array_ptr,
+   HYPRE_Int       na,
+   HYPRE_Int      *aknum_array,
+   HYPRE_Complex  *aki_array);
+
+HYPRE_Int
+AdjustBCSolutionEquations(
+   HYPRE_Complex  *solution,
+   HYPRE_Int       nb,
+   HYPRE_Int      *binum_array,
+   HYPRE_Int      *bjnum_array,
+   HYPRE_Complex  *bii_array,
+   HYPRE_Complex  *bij_array,
+   HYPRE_Complex  *brhs_array);
+
+HYPRE_Int
+AdjustBCEquationsFree(
+   HYPRE_Int     *binum_array,
+   HYPRE_Int     *bjnum_array,
+   HYPRE_Complex *bii_array,
+   HYPRE_Complex *bij_array,
+   HYPRE_Complex *brhs_array,
+   HYPRE_Int     *aknum_array,
+   HYPRE_Complex *aki_array);
+
 #include <memory>
 
 // BOUT_ENUM_CLASS does not work inside namespaces
@@ -174,6 +224,24 @@ public:
     HypreMalloc(V, vsize * sizeof(HYPRE_Complex));
   }
 
+  // Data for eliminating boundary equations (TODO: convert this to a structure)
+  bool elimBErhs = false;
+  bool elimBEsol = false;
+  HYPRE_Complex *rhs;
+  HYPRE_Int      nb;
+  HYPRE_Int     *binum_array;
+  HYPRE_Int     *bjnum_array;
+  HYPRE_Complex *bii_array;
+  HYPRE_Complex *bij_array;
+  HYPRE_Complex *brhs_array; // This is not created from the HypreMatrix class
+  HYPRE_Int      na;
+  HYPRE_Int     *aknum_array;
+  HYPRE_Complex *aki_array;
+
+  void syncElimBErhs(HypreVector<T>& rhs) {
+    brhs_array = rhs.brhs_array;
+  }
+
   void assemble() {
     CALI_CXX_MARK_FUNCTION;
     writeCacheToHypre();
@@ -183,11 +251,20 @@ public:
   }
 
   void writeCacheToHypre() {
+    if (elimBErhs)
+    {
+      AdjustBCRightHandSideEquations(V, nb, binum_array, bii_array, bij_array, &brhs_array,
+                                     na, aknum_array, aki_array);
+    }
     checkHypreError(HYPRE_IJVectorSetValues(hypre_vector, vsize, I, V));
   }
 
   void readCacheFromHypre() {
     checkHypreError(HYPRE_IJVectorGetValues(hypre_vector, vsize, I, V));
+    if (elimBEsol)
+    {
+      AdjustBCSolutionEquations(V, nb, binum_array, bjnum_array, bii_array, bij_array, brhs_array);
+    }
   }
 
   T toField() {
@@ -667,6 +744,43 @@ public:
     return Element(*this, global_row, global_column, positions, weights);
   }
 
+  // Data for eliminating boundary equations (TODO: convert this to a structure)
+  bool elimBE = false;
+  HYPRE_Int      nb;
+  HYPRE_Int     *binum_array;
+  HYPRE_Int     *bjnum_array;
+  HYPRE_Complex *bii_array;
+  HYPRE_Complex *bij_array;
+  HYPRE_Int      na;
+  HYPRE_Int     *aknum_array;
+  HYPRE_Complex *aki_array;
+
+  void setElimBE() {
+    elimBE = true;
+  }
+
+  void setElimBEVectors(HypreVector<T>& sol, HypreVector<T>& rhs) {
+    sol.elimBEsol = elimBE;
+    sol.nb          = nb;
+    sol.binum_array = binum_array;
+    sol.bjnum_array = bjnum_array;
+    sol.bii_array   = bii_array;
+    sol.bij_array   = bij_array;
+    sol.na          = na;
+    sol.aknum_array = aknum_array;
+    sol.aki_array   = aki_array;
+
+    rhs.elimBErhs = elimBE;
+    rhs.nb          = nb;
+    rhs.binum_array = binum_array;
+    rhs.bjnum_array = bjnum_array;
+    rhs.bii_array   = bii_array;
+    rhs.bij_array   = bij_array;
+    rhs.na          = na;
+    rhs.aknum_array = aknum_array;
+    rhs.aki_array   = aki_array;
+  }
+
   void assemble() {
     CALI_CXX_MARK_FUNCTION;
 
@@ -695,8 +809,85 @@ public:
         entry++;
       }
     }
-    checkHypreError(
+
+    // Eliminate boundary condition equations in hypre SetValues input arguments
+    if (elimBE)
+    {
+      HYPRE_Int *bi_array;
+      HYPRE_Int *row_indexes;
+      // There must be an easier way to get nb
+      nb = 0;
+      BOUT_FOR_SERIAL(i, index_converter->getRegionBndry()) {
+         nb++;
+      }
+      HypreMalloc(bi_array, nb * sizeof(HYPRE_Int));
+      nb = 0;
+      BOUT_FOR_SERIAL(i, index_converter->getRegionBndry()) {
+         bi_array[nb] = index_converter->getGlobal(i);
+         nb++;
+      }
+      AdjustBCMatrixEquations(num_rows, num_cols, rawI, &row_indexes, cols, vals,
+                              nb, bi_array,
+                              &binum_array, &bjnum_array, &bii_array, &bij_array,
+                              &na, &aknum_array, &aki_array);
+      HypreFree(bi_array);
+//    {
+//       FILE  *file;
+//       int    i;
+//       file = fopen("zbout.setvalues.out2", "w");
+//       fprintf(file, "nrows %d\n", num_rows);
+//       for (i = 0; i < num_rows; i++)
+//       {
+//          fprintf(file, "ncols %d: %d\n", i, num_cols[i]);
+//       }
+//       for (i = 0; i < num_rows; i++)
+//       {
+//          fprintf(file, "rows %d: %d\n", i, rawI[i]);
+//       }
+//       for (i = 0; i < num_entries; i++)
+//       {
+//          fprintf(file, "cols %d: %d\n", i, cols[i]);
+//       }
+//       for (i = 0; i < num_entries; i++)
+//       {
+//          fprintf(file, "vals %d: %f\n", i, vals[i]);
+//       }
+//       fclose(file);
+//
+//       file = fopen("zbout.setvalues.out3", "w");
+//       for (i = 0; i < num_rows; i++)
+//       {
+//          fprintf(file, "row_indexes %d: %d\n", i, row_indexes[i]);
+//       }
+//       fprintf(file, "nb %d\n", nb);
+//       for (i = 0; i < nb; i++)
+//       {
+//          fprintf(file, "bijnum_array %d: %d %d\n", i, binum_array[i], bjnum_array[i]);
+//       }
+//       for (i = 0; i < nb; i++)
+//       {
+//          fprintf(file, "biiij_array %d: %f %f\n", i, bii_array[i], bij_array[i]);
+//       }
+//       fprintf(file, "na %d\n", na);
+//       for (i = 0; i < na; i++)
+//       {
+//          fprintf(file, "aknum_array %d: %d\n", i, aknum_array[i]);
+//       }
+//       for (i = 0; i < na; i++)
+//       {
+//          fprintf(file, "bki_array %d: %f\n", i, aki_array[i]);
+//       }
+//       fclose(file);
+//    }
+      checkHypreError(
+        HYPRE_IJMatrixSetValues2(*hypre_matrix, num_rows, num_cols, rawI, row_indexes, cols, vals));
+      HypreFree(row_indexes);
+    }
+    else
+    {
+      checkHypreError(
         HYPRE_IJMatrixSetValues(*hypre_matrix, num_rows, num_cols, rawI, cols, vals));
+    }
     checkHypreError(HYPRE_IJMatrixAssemble(*hypre_matrix));
     checkHypreError(HYPRE_IJMatrixGetObject(*hypre_matrix,
                                             reinterpret_cast<void**>(&parallel_matrix)));
diff --git a/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx b/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx
index c50be1db85..def54b36b5 100644
--- a/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx
+++ b/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx
@@ -28,6 +28,7 @@
 #if BOUT_HAS_HYPRE
 
 #include "hypre3d_laplace.hxx"
+#include "hypre_boundary.c"
 
 #include <bout/assert.hxx>
 #include <bout/boutcomm.hxx>
@@ -218,11 +219,15 @@ Field3D LaplaceHypre3d::solve(const Field3D& b_in, const Field3D& x0) {
 
   CALI_MARK_BEGIN("LaplaceHypre3d_solve:vectorAssemble");
 
+  operator3D.setElimBEVectors(solution, rhs);
+
   rhs.importValuesFromField(b);
   solution.importValuesFromField(x0);
   rhs.assemble();
   solution.assemble();
 
+  solution.syncElimBErhs(rhs);
+
   CALI_MARK_END("LaplaceHypre3d_solve:vectorAssemble");
 
   CALI_MARK_BEGIN("LaplaceHypre3d_solve:solve");
@@ -411,6 +416,7 @@ void LaplaceHypre3d::updateMatrix3D() {
     operator3D.ydown(ydown)(l, l.ym().zp()) += -C_d2f_dydz;
     operator3D.ydown(ydown)(l, l.ym().zm()) += C_d2f_dydz;
   }
+  operator3D.setElimBE();
   operator3D.assemble();
 
   if (print_matrix) {
diff --git a/src/invert/laplace/impls/hypre3d/hypre_boundary.c b/src/invert/laplace/impls/hypre3d/hypre_boundary.c
new file mode 100644
index 0000000000..c4e7393c3f
--- /dev/null
+++ b/src/invert/laplace/impls/hypre3d/hypre_boundary.c
@@ -0,0 +1,252 @@
+
+/*
+ * This function modifies the input for the HYPRE_IJMatrixSetValues() routine to
+ * eliminate the boundary condition equations (see below for details on how the
+ * equations are adjusted).  It modifies the arrays ncols, rows, cols, and
+ * values.  It also returns a row_indexes array.  This can then be passed to the
+ * HYPRE_IJMatrixSetValues2() routine to set up the matrix in hypre.
+ *
+ * The arguments nb and bi_array indicate the boundary equations.  The routine
+ * returns info needed to adjust the right-hand-side and solution vector through
+ * the functions AdjustBCRightHandSideEquations and AdjustBCSolutionEquations.
+ *
+ * Returned info arrays can be freed with the function AdjustBCEquationsFree().
+ *
+ * NOTE: It may make sense from an organizational standpoint to collect many of
+ * these arguments in a structure of some sort.
+ *
+ * Notation, assumptions, and other details:
+ *
+ * - Boundary equation i is assumed to have two coefficients
+ *
+ *      b_ii * u_i + b_ij * u_j = rhs_i
+ *
+ * - We also assume that each boundary equation has only one interior equation k
+ *   coupled to it (such that k = j) with coupling coefficient a_ki
+ *
+ *      a_ki * u_i + a_kj * u_j + ... = rhs_k
+ *
+ * - Each equation k is adjusted as follows:
+ *
+ *      a_kj = a_kj - a_ki * b_ij / b_ii
+ *      a_ki = 0
+ *
+ * - Boundary equations are adjusted to be identity equations in the matrix, but
+ *   the boundary coefficients (b_ii, b_ij) are returned for use later
+ *
+ * - Right-hand-side equations are adjusted in AdjustBCRightHandSideEquations()
+ *   as follows: rhs_k = rhs_k - a_ki * rhs_i / b_ii
+ *
+ * - Solution unknowns are adjusted at boundaries in AdjustBCSolutionEquations()
+ *   as follows: u_i = (rhs_i - b_ij * u_j) / b_ii
+ *
+ * - Naming conventions: Arrays starting with 'b' are boundary equation arrays
+ *   indexed by 'bnum', and arrays starting with 'a' are non-boundary arrays
+ *   (interior matrix equations) indexed by 'anum'.  When 'num' is prefixed with
+ *   a row or column number 'i', 'j', or 'k', the array holds the corresponding
+ *   local data index for that row or column (e.g., an index into the local
+ *   solution vector).  Matrix coefficients are named as above, e.g., 'bij' is
+ *   the coefficient for b_ij.
+ */
+
+HYPRE_Int
+AdjustBCMatrixEquations(
+   HYPRE_Int       nrows,           // number of rows described by ncols/rows
+   HYPRE_Int      *ncols,           // entries per row; set to 1 for each boundary row
+   HYPRE_BigInt   *rows,            // row number of each row (assumed sorted)
+   HYPRE_Int     **row_indexes_ptr, // returns offset of each row's first entry in cols/values
+   HYPRE_BigInt   *cols,            // column number of every entry, row after row
+   HYPRE_Complex  *values,          // coefficient of every entry; adjusted in place
+   HYPRE_Int       nb,              // number of boundary equations
+   HYPRE_Int      *bi_array,        // row i for each boundary equation
+   HYPRE_Int     **binum_array_ptr, // data index for row i (for each boundary equation)
+   HYPRE_Int     **bjnum_array_ptr, // data index for col j (for each boundary equation)
+   HYPRE_Complex **bii_array_ptr,   // coefficient b_ii (for each boundary equation)
+   HYPRE_Complex **bij_array_ptr,   // coefficient b_ij (for each boundary equation)
+   HYPRE_Int      *na_ptr,          // number of interior equations to adjust
+   HYPRE_Int     **aknum_array_ptr, // data index for row k (for each interior equation)
+   HYPRE_Complex **aki_array_ptr)   // coefficient a_ki (for each interior equation)
+{
+   HYPRE_Int     *row_indexes;
+   HYPRE_Int      na, *binum_array, *bjnum_array, *aknum_array;
+   HYPRE_Complex *bii_array, *bij_array, *aki_array;
+   HYPRE_Int      i, j, k, m, mkj, anum, bnum, acoeffnum, bcoeffnum;
+   HYPRE_Int      binum, aknum;
+   HYPRE_Complex  bii, bij, aki;
+
+   /* Create the row_indexes array: running sum of ncols, i.e. where each row starts. */
+   HypreMalloc(row_indexes, sizeof(HYPRE_Int) * nrows);   // same allocator as the other arrays, so HypreFree can release it
+   for (i = 0, m = 0; i < nrows; i++)   // also safe for nrows == 0 (nothing is written)
+   {
+      row_indexes[i] = m;
+      m += ncols[i];
+   }
+
+   /* Assume just one interior equation coupled to each boundary equation */
+   na = nb;
+
+   /* Allocate return arrays */
+   HypreMalloc(binum_array, sizeof(HYPRE_Int) * nb);
+   HypreMalloc(bjnum_array, sizeof(HYPRE_Int) * nb);
+   HypreMalloc(bii_array,   sizeof(HYPRE_Complex) * nb);
+   HypreMalloc(bij_array,   sizeof(HYPRE_Complex) * nb);
+   HypreMalloc(aknum_array, sizeof(HYPRE_Int) * na);
+   HypreMalloc(aki_array,   sizeof(HYPRE_Complex) * na);
+
+   binum = 0;
+   aknum = 0;
+   for (bnum = 0; bnum < nb; bnum++)
+   {
+      /* Get boundary equation information and adjust boundary equations */
+      /* Find row i in rows array (assume i increases and rows is sorted) */
+      i = bi_array[bnum];
+      for (; binum < nrows; binum++)
+      {
+         if (i == rows[binum])
+         {
+            break;   // Found row i in rows array
+         }
+      }
+      bcoeffnum = row_indexes[binum];
+      for (m = 0; m < 2; m++)               // Assume only two boundary equation coefficients
+      {
+         if (cols[bcoeffnum + m] == i)
+         {
+            bii = values[bcoeffnum + m];
+            values[bcoeffnum + m] = -1.0;   // Identity equation (negative definite matrix)
+         }
+         else
+         {
+            j = cols[bcoeffnum + m];
+            bij = values[bcoeffnum + m];
+            values[bcoeffnum + m] = 0.0;   // Identity equation
+         }
+      }
+      ncols[binum] = 1;                  // Identity equation
+      /* NOTE(review): with ncols == 1 only the row's first entry stays in use; presumably the diagonal is stored first - confirm */
+      /* Get interior equation information and adjust interior equations */
+      /* Find row k in rows array (assume k increases and rows is sorted) */
+      k = j;         // Assume equation k = j
+      for (; aknum < nrows; aknum++)   // NOTE(review): search is never rewound; a non-increasing k would run off the end - confirm ordering
+      {
+         if (k == rows[aknum])
+         {
+            break;   // Found row k in rows array
+         }
+      }
+      acoeffnum = row_indexes[aknum];
+      for (m = 0; m < ncols[aknum]; m++)
+      {
+         if (cols[acoeffnum + m] == j)
+         {
+            mkj = m;                       // Save for update of akj value below
+         }
+         if (cols[acoeffnum + m] == i)
+         {
+            aki = values[acoeffnum + m];
+            values[acoeffnum + m] = 0.0;   // Eliminate coupling to boundary equation
+         }
+      }
+      values[acoeffnum + mkj] -= aki * bij / bii;   // Update akj value
+
+      /* Update return arrays */
+      anum = bnum;                // Assume only one interior equation k
+      binum_array[bnum] = binum;
+      bjnum_array[bnum] = aknum;  // Assume only one interior equation k
+      bii_array[bnum]   = bii;
+      bij_array[bnum]   = bij;
+      aknum_array[anum] = aknum;
+      aki_array[anum]   = aki;
+   }
+
+   /* Set return arguments */
+   *row_indexes_ptr = row_indexes;
+   *binum_array_ptr = binum_array;
+   *bjnum_array_ptr = bjnum_array;
+   *bii_array_ptr   = bii_array;
+   *bij_array_ptr   = bij_array;
+   *na_ptr          = na;
+   *aknum_array_ptr = aknum_array;
+   *aki_array_ptr   = aki_array;
+
+   return 0;
+}
+
+HYPRE_Int
+AdjustBCRightHandSideEquations(
+   HYPRE_Complex  *rhs,            // right-hand-side values; interior rows are adjusted in place
+   HYPRE_Int       nb,             // number of boundary equations
+   HYPRE_Int      *binum_array,    // data index for row i (for each boundary equation)
+   HYPRE_Complex  *bii_array,      // coefficient b_ii (for each boundary equation)
+   HYPRE_Complex  *bij_array,      // coefficient b_ij (for each boundary equation); not used here
+   HYPRE_Complex **brhs_array_ptr, // returns a newly allocated copy of rhs_i (for each boundary equation)
+   HYPRE_Int       na,             // number of interior equations to adjust
+   HYPRE_Int      *aknum_array,    // data index for row k (for each interior equation)
+   HYPRE_Complex  *aki_array)      // coefficient a_ki (for each interior equation)
+{
+   HYPRE_Complex *brhs_array;
+   HYPRE_Int      anum, bnum, binum, aknum;
+   /* Keep the unmodified rhs_i of every boundary row; AdjustBCSolutionEquations() needs them. */
+   HypreMalloc(brhs_array, sizeof(HYPRE_Complex) * nb);
+   (void)bij_array;   // b_ij does not enter the right-hand-side update; parameter kept for interface stability
+   for (bnum = 0; bnum < nb; bnum++)
+   {
+      binum = binum_array[bnum];
+      brhs_array[bnum] = rhs[binum];
+   }
+   /* Eliminate the boundary unknown from row k: rhs_k = rhs_k - a_ki * rhs_i / b_ii */
+   for (anum = 0; anum < na; anum++)
+   {
+      bnum  = anum;   // Assume only one interior equation per boundary equation
+      aknum = aknum_array[anum];
+      rhs[aknum] -= aki_array[anum] * brhs_array[bnum] / bii_array[bnum];
+   }
+   /* A fresh brhs_array is allocated on every call; the caller owns it afterwards. */
+   *brhs_array_ptr = brhs_array;
+
+   return 0;
+}
+
+HYPRE_Int
+AdjustBCSolutionEquations(
+   HYPRE_Complex  *solution,     // solution values; boundary entries are overwritten in place
+   HYPRE_Int       nb,           // number of boundary equations
+   HYPRE_Int      *binum_array,  // data index for row i (for each boundary equation)
+   HYPRE_Int      *bjnum_array,  // data index for col j (for each boundary equation)
+   HYPRE_Complex  *bii_array,    // coefficient b_ii (for each boundary equation)
+   HYPRE_Complex  *bij_array,    // coefficient b_ij (for each boundary equation)
+   HYPRE_Complex  *brhs_array)   // saved right-hand side rhs_i (for each boundary equation)
+{
+   HYPRE_Int  bnum, binum, bjnum;
+   /* Recover each boundary unknown from its original equation: u_i = (rhs_i - b_ij * u_j) / b_ii */
+   for (bnum = 0; bnum < nb; bnum++)
+   {
+      binum = binum_array[bnum];
+      bjnum = bjnum_array[bnum];
+      solution[binum] = (brhs_array[bnum] - bij_array[bnum] * solution[bjnum]) / bii_array[bnum];
+   }
+
+   return 0;
+}
+
+HYPRE_Int
+AdjustBCEquationsFree(
+   HYPRE_Int     *binum_array,   // data index for row i (for each boundary equation)
+   HYPRE_Int     *bjnum_array,   // data index for col j (for each boundary equation)
+   HYPRE_Complex *bii_array,     // coefficient b_ii (for each boundary equation)
+   HYPRE_Complex *bij_array,     // coefficient b_ij (for each boundary equation)
+   HYPRE_Complex *brhs_array,    // saved right-hand side rhs_i (for each boundary equation)
+   HYPRE_Int     *aknum_array,   // data index for row k (for each interior equation)
+   HYPRE_Complex *aki_array)     // coefficient a_ki (for each interior equation)
+{
+   HypreFree(binum_array);
+   HypreFree(bjnum_array);
+   HypreFree(bii_array);
+   HypreFree(bij_array);
+   HypreFree(brhs_array);
+   HypreFree(aknum_array);
+   HypreFree(aki_array);
+   /* Every array handed in has been passed to HypreFree; always reports success. */
+   return 0;
+}
+

From 14a621b49efc130e9d5851a3138fc1352a719b18 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Tue, 4 Mar 2025 17:45:08 -0800
Subject: [PATCH 015/129] elm_pb example: Fix outer boundary phivalue

Should average over Z
---
 examples/elm-pb/elm_pb.cxx | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/examples/elm-pb/elm_pb.cxx b/examples/elm-pb/elm_pb.cxx
index 4c34dee0ad..b36bd728d4 100644
--- a/examples/elm-pb/elm_pb.cxx
+++ b/examples/elm-pb/elm_pb.cxx
@@ -1410,11 +1410,14 @@ class ELMpb : public PhysicsModel {
           if (mesh->lastX()) {
             for (int j = mesh->ystart; j <= mesh->yend; j++) {
               BoutReal phivalue = 0.0;
-              BoutReal oldvalue = 0.0;
               for (int k = 0; k < mesh->LocalNz; k++) {
-                phivalue = phi(mesh->xend, j, k);
-                oldvalue = 0.5 * (phi(mesh->xend + 1, j, k) + phi(mesh->xend, j, k));
+                phivalue += phi(mesh->xend, j, k);
               }
+              phivalue /= mesh->LocalNz; // Average in Z of point next to boundary
+
+              // Old value of phi at boundary. Note: this is constant in Z
+              BoutReal oldvalue =
+                  0.5 * (phi(mesh->xend + 1, j, 0) + phi(mesh->xend, j, 0));
 
               // New value of phi at boundary, relaxing towards phivalue
               BoutReal newvalue = weight * oldvalue + (1. - weight) * phivalue;

From e3f4a98ac6235b0bef6ffc4d90ec2da2f1ecb668 Mon Sep 17 00:00:00 2001
From: Rob Falgout <rfalgout@llnl.gov>
Date: Wed, 5 Mar 2025 08:35:17 -0800
Subject: [PATCH 016/129] Added HYPRE GMRES SetKDim call.  Need to make this an
 input file parameter.

---
 include/bout/hypre_interface.hxx | 16 ++++++++++++++++
 1 file changed, 16 insertions(+)

diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index 72eec916e2..efb620241e 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -1067,6 +1067,22 @@ public:
     setMaxIter(
         options["maxits"].doc("Maximum iterations for Hypre solver").withDefault(10000));
 
+    switch (solver_type) {
+    case HYPRE_SOLVER_TYPE::gmres: {
+       HYPRE_ParCSRGMRESSetKDim(solver, 30);  // TODO: Make this an input file parameter
+      break;
+    }
+    case HYPRE_SOLVER_TYPE::bicgstab: {
+      break;
+    }
+    case HYPRE_SOLVER_TYPE::pcg: {
+      break;
+    }
+    default: {
+      throw BoutException("Unsupported hypre_solver_type {}", toString(solver_type));
+    }
+    }
+
     HYPRE_BoomerAMGCreate(&precon);
     HYPRE_BoomerAMGSetOldDefault(precon);
 #if BOUT_HAS_CUDA

From ef069675e39a6e92355036c45f3f20183a67e628 Mon Sep 17 00:00:00 2001
From: Rob Falgout <rfalgout@llnl.gov>
Date: Wed, 5 Mar 2025 09:53:21 -0800
Subject: [PATCH 017/129] Added code to free up data.  The HypreMatrix destroy
 needs to be updated.

---
 examples/elm-pb/elm_pb.cxx                    | 134 ++++++++++++++----
 include/bout/hypre_interface.hxx              |  41 +++---
 .../laplace/impls/hypre3d/hypre_boundary.c    |  35 +----
 3 files changed, 129 insertions(+), 81 deletions(-)

diff --git a/examples/elm-pb/elm_pb.cxx b/examples/elm-pb/elm_pb.cxx
index f830f3d98a..c332edd223 100644
--- a/examples/elm-pb/elm_pb.cxx
+++ b/examples/elm-pb/elm_pb.cxx
@@ -46,6 +46,7 @@ class ELMpb : public PhysicsModel {
   Coordinates::FieldMetric U0; // 0th vorticity of equilibrium flow,
   // radial flux coordinate, normalized radial flux coordinate
 
+  bool laplace_perp;    // Use Laplace_perp or Delp2?
   bool constn0;
   // the total height, average width and center of profile of N0
   BoutReal n0_height, n0_ave, n0_width, n0_center, n0_bottom_x, Nbar, Tibar, Tebar;
@@ -350,7 +351,8 @@ class ELMpb : public PhysicsModel {
     //////////////////////////////////////////////////////////////
     auto& globalOptions = Options::root();
     auto& options = globalOptions["highbeta"];
-
+    laplace_perp = options["laplace_perp"].withDefault(false);    
+    // Use Laplace_perp rather than Delp2
     constn0 = options["constn0"].withDefault(true);
     // use the hyperbolic profile of n0. If both  n0_fake_prof and
     // T0_fake_prof are false, use the profiles from grid file
@@ -1315,7 +1317,11 @@ class ELMpb : public PhysicsModel {
       Ctmp.applyBoundary();
       Ctmp -= phi; // Now contains error in the boundary
 
-      C_phi = Delp2(phi) - U; // Error in the bulk
+      if (laplace_perp) {
+        C_phi = Laplace_perp(phi) - U; // Error in the bulk
+      } else {
+        C_phi = Delp2(phi) - U; // Error in the bulk
+      }
       C_phi.setBoundaryTo(Ctmp);
 
     } else {
@@ -1347,8 +1353,12 @@ class ELMpb : public PhysicsModel {
       } else {
         ubyn = U / N0;
         if (diamag) {
-          ubyn -= 0.5 * dnorm / (N0 * B0) * Delp2(P);
-          mesh->communicate(ubyn);
+          if (laplace_perp) {
+            ubyn -= 0.5 * dnorm / (N0 * B0) * Laplace_perp(P);
+	  } else {
+            ubyn -= 0.5 * dnorm / (N0 * B0) * Delp2(P); 
+	  }
+	  mesh->communicate(ubyn);
         }
         // Invert laplacian for phi
         phiSolver->setCoefC(N0);
@@ -1361,9 +1371,18 @@ class ELMpb : public PhysicsModel {
 
     if (!evolve_jpar) {
       // Get J from Psi
-      Jpar = Delp2(Psi);
+      if (laplace_perp) {
+        Jpar = Laplace_perp(Psi);
+      } else {
+        Jpar = Delp2(Psi);
+      }
+
       if (include_rmp) {
-        Jpar += Delp2(rmp_Psi);
+        if (laplace_perp) {	
+          Jpar += Laplace_perp(rmp_Psi);
+	} else {
+          Jpar += Delp2(rmp_Psi);
+	}
       }
 
       Jpar.applyBoundary();
@@ -1397,8 +1416,11 @@ class ELMpb : public PhysicsModel {
       }
 
       // Get Delp2(J) from J
-      Jpar2 = Delp2(Jpar);
-
+      if (laplace_perp) {	
+        Jpar2 = Laplace_perp(Jpar);
+      } else {
+        Jpar2 = Delp2(Jpar);
+      }
       Jpar2.applyBoundary();
       mesh->communicate(Jpar2);
 
@@ -1494,7 +1516,11 @@ class ELMpb : public PhysicsModel {
       // Jpar
       Field3D B0U = B0 * U;
       mesh->communicate(B0U);
-      ddt(Jpar) = -Grad_parP(B0U, loc) / B0 + eta * Delp2(Jpar);
+      if (laplace_perp) {
+        ddt(Jpar) = -Grad_parP(B0U, loc) / B0 + eta * Laplace_perp(Jpar);
+      }else {
+        ddt(Jpar) = -Grad_parP(B0U, loc) / B0 + eta * Delp2(Jpar);
+      }
 
       if (relax_j_vac) {
         // Make ddt(Jpar) relax to zero.
@@ -1524,11 +1550,19 @@ class ELMpb : public PhysicsModel {
       }
 
       if (hyperresist > 0.0) { // Hyper-resistivity
-        ddt(Psi) -= eta * hyperresist * Delp2(Jpar);
+        if (laplace_perp) {
+          ddt(Psi) -= eta * hyperresist * Laplace_perp(Jpar);
+	} else {
+          ddt(Psi) -= eta * hyperresist * Delp2(Jpar);	
+	}
       }
 
       if (ehyperviscos > 0.0) { // electron Hyper-viscosity coefficient
-        ddt(Psi) -= eta * ehyperviscos * Delp2(Jpar2);
+        if (laplace_perp) {
+          ddt(Psi) -= eta * ehyperviscos * Laplace_perp(Jpar2);
+	} else {
+          ddt(Psi) -= eta * ehyperviscos * Delp2(Jpar2);
+	}
       }
 
       // Parallel hyper-viscous diffusion for vector potential
@@ -1599,7 +1633,11 @@ class ELMpb : public PhysicsModel {
     }
 
     if (viscos_perp > 0.0) {
-      ddt(U) += viscos_perp * Delp2(U); // Perpendicular viscosity
+      if (laplace_perp) {
+        ddt(U) += viscos_perp * Laplace_perp(U); // Perpendicular viscosity
+      } else {
+        ddt(U) += viscos_perp * Delp2(U); // Perpendicular viscosity
+      }
     }
 
     // Hyper-viscosity
@@ -1626,21 +1664,40 @@ class ELMpb : public PhysicsModel {
       Pi = 0.5 * P;
       Pi0 = 0.5 * P0;
 
-      Dperp2Phi0 = Field3D(Delp2(B0 * phi0));
-      Dperp2Phi0.applyBoundary();
-      mesh->communicate(Dperp2Phi0);
+      if (laplace_perp) {
+        Dperp2Phi0 = Field3D(Laplace_perp(B0 * phi0));
+        Dperp2Phi0.applyBoundary();
+        mesh->communicate(Dperp2Phi0);
 
-      Dperp2Phi = Delp2(B0 * phi);
-      Dperp2Phi.applyBoundary();
-      mesh->communicate(Dperp2Phi);
+        Dperp2Phi = Laplace_perp(B0 * phi);
+        Dperp2Phi.applyBoundary();
+        mesh->communicate(Dperp2Phi);
 
-      Dperp2Pi0 = Field3D(Delp2(Pi0));
-      Dperp2Pi0.applyBoundary();
-      mesh->communicate(Dperp2Pi0);
+        Dperp2Pi0 = Field3D(Laplace_perp(Pi0));
+        Dperp2Pi0.applyBoundary();
+        mesh->communicate(Dperp2Pi0);
 
-      Dperp2Pi = Delp2(Pi);
-      Dperp2Pi.applyBoundary();
-      mesh->communicate(Dperp2Pi);
+        Dperp2Pi = Laplace_perp(Pi);
+        Dperp2Pi.applyBoundary();
+        mesh->communicate(Dperp2Pi);
+      } else {
+        Dperp2Phi0 = Field3D(Delp2(B0 * phi0));
+        Dperp2Phi0.applyBoundary();
+        mesh->communicate(Dperp2Phi0);
+
+        Dperp2Phi = Delp2(B0 * phi);
+        Dperp2Phi.applyBoundary();
+        mesh->communicate(Dperp2Phi);
+
+        Dperp2Pi0 = Field3D(Delp2(Pi0));
+        Dperp2Pi0.applyBoundary();
+        mesh->communicate(Dperp2Pi0);
+
+        Dperp2Pi = Delp2(Pi);
+        Dperp2Pi.applyBoundary();
+        mesh->communicate(Dperp2Pi);
+      
+      }
 
       bracketPhi0P = bracket(B0 * phi0, Pi, bm_exb);
       bracketPhi0P.applyBoundary();
@@ -1658,8 +1715,13 @@ class ELMpb : public PhysicsModel {
       mesh->communicate(B0phi0);
       ddt(U) += 0.5 * Upara2 * bracket(B0phi, Dperp2Pi0, bm_exb) / B0;
       ddt(U) += 0.5 * Upara2 * bracket(B0phi0, Dperp2Pi, bm_exb) / B0;
-      ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhi0P) / B0;
-      ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhiP0) / B0;
+      if (laplace_perp) {
+        ddt(U) -= 0.5 * Upara2 * Laplace_perp(bracketPhi0P) / B0;
+        ddt(U) -= 0.5 * Upara2 * Laplace_perp(bracketPhiP0) / B0;
+      } else {
+        ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhi0P) / B0;
+        ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhiP0) / B0;
+      }
 
       if (nonlinear) {
         Field3D B0phi = B0 * phi;
@@ -1670,7 +1732,11 @@ class ELMpb : public PhysicsModel {
 
         ddt(U) -= 0.5 * Upara2 * bracket(Pi, Dperp2Phi, bm_exb) / B0;
         ddt(U) += 0.5 * Upara2 * bracket(B0phi, Dperp2Pi, bm_exb) / B0;
-        ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhiP) / B0;
+        if (laplace_perp) {
+          ddt(U) -= 0.5 * Upara2 * Laplace_perp(bracketPhiP) / B0;
+	} else {
+  	  ddt(U) -= 0.5 * Upara2 * Delp2(bracketPhiP) / B0;
+	}
       }
     }
 
@@ -1808,7 +1874,12 @@ class ELMpb : public PhysicsModel {
   int precon(BoutReal UNUSED(t), BoutReal gamma, BoutReal UNUSED(delta)) {
     // First matrix, applying L
     mesh->communicate(ddt(Psi));
-    Field3D Jrhs = Delp2(ddt(Psi));
+    Field3D Jrhs;
+    if (laplace_perp) {	
+      Jrhs = Laplace_perp(ddt(Psi));
+    } else {
+      Jrhs = Delp2(ddt(Psi));
+    }
     Jrhs.applyBoundary("neumann");
 
     if (jpar_bndry_width > 0) {
@@ -1880,8 +1951,11 @@ class ELMpb : public PhysicsModel {
 
     phi = phiSolver->solve(ddt(U));
 
-    Jpar = Delp2(ddt(Psi));
-
+    if (laplace_perp) {	
+      Jpar = Laplace_perp(ddt(Psi));
+    } else {
+      Jpar = Delp2(ddt(Psi));
+    }
     mesh->communicate(phi, Jpar);
 
     Field3D JP = -b0xGrad_dot_Grad(phi, P0);
diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index efb620241e..0025ed062b 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -20,7 +20,7 @@
 #include "HYPRE_utilities.h"
 #include "_hypre_utilities.h"
 
-HYPRE_Int
+void
 AdjustBCMatrixEquations(
    HYPRE_Int       nrows,
    HYPRE_Int      *ncols,
@@ -38,7 +38,7 @@ AdjustBCMatrixEquations(
    HYPRE_Int     **aknum_array_ptr, // data index for row k (for each interior equation)
    HYPRE_Complex **aki_array_ptr);  // coefficient a_ki (for each interior equation)
 
-HYPRE_Int
+void
 AdjustBCRightHandSideEquations(
    HYPRE_Complex  *rhs,
    HYPRE_Int       nb,
@@ -50,7 +50,7 @@ AdjustBCRightHandSideEquations(
    HYPRE_Int      *aknum_array,
    HYPRE_Complex  *aki_array);
 
-HYPRE_Int
+void
 AdjustBCSolutionEquations(
    HYPRE_Complex  *solution,
    HYPRE_Int       nb,
@@ -60,16 +60,6 @@ AdjustBCSolutionEquations(
    HYPRE_Complex  *bij_array,
    HYPRE_Complex  *brhs_array);
 
-HYPRE_Int
-AdjustBCEquationsFree(
-   HYPRE_Int     *binum_array,
-   HYPRE_Int     *bjnum_array,
-   HYPRE_Complex *bii_array,
-   HYPRE_Complex *bij_array,
-   HYPRE_Complex *brhs_array,
-   HYPRE_Int     *aknum_array,
-   HYPRE_Complex *aki_array);
-
 #include <memory>
 
 // BOUT_ENUM_CLASS does not work inside namespaces
@@ -136,6 +126,9 @@ public:
     checkHypreError(HYPRE_IJVectorDestroy(hypre_vector));
     HypreFree(I);
     HypreFree(V);
+    if (elimBErhs) {
+      HypreFree(brhs_array);
+    }
   }
 
   // Disable copy, at least for now: not clear that HYPRE_IJVector is
@@ -251,8 +244,7 @@ public:
   }
 
   void writeCacheToHypre() {
-    if (elimBErhs)
-    {
+    if (elimBErhs) {
       AdjustBCRightHandSideEquations(V, nb, binum_array, bii_array, bij_array, &brhs_array,
                                      na, aknum_array, aki_array);
     }
@@ -261,8 +253,7 @@ public:
 
   void readCacheFromHypre() {
     checkHypreError(HYPRE_IJVectorGetValues(hypre_vector, vsize, I, V));
-    if (elimBEsol)
-    {
+    if (elimBEsol) {
       AdjustBCSolutionEquations(V, nb, binum_array, bjnum_array, bii_array, bij_array, brhs_array);
     }
   }
@@ -419,6 +410,19 @@ public:
   using ind_type = typename T::ind_type;
 
   HypreMatrix() = default;
+//  The 'if' block below needs to be called when the HypreMatrix is destroyed,
+//  but I don't know where to put it.  The HypreMatrix class is handled
+//  differently from HypreVector.
+//  ~HypreVector() {
+//    if (elimBE) {
+//      HypreFree(binum_array);
+//      HypreFree(bjnum_array);
+//      HypreFree(bii_array);
+//      HypreFree(bij_array);
+//      HypreFree(aknum_array);
+//      HypreFree(aki_array);
+//    }
+//  }
   HypreMatrix(const HypreMatrix<T>&) = delete;
   HypreMatrix(HypreMatrix<T>&& other)
       : comm(other.comm), ilower(other.ilower), iupper(other.iupper),
@@ -811,8 +815,7 @@ public:
     }
 
     // Eliminate boundary condition equations in hypre SetValues input arguments
-    if (elimBE)
-    {
+    if (elimBE) {
       HYPRE_Int *bi_array;
       HYPRE_Int *row_indexes;
       // There must be an easier way to get nb
diff --git a/src/invert/laplace/impls/hypre3d/hypre_boundary.c b/src/invert/laplace/impls/hypre3d/hypre_boundary.c
index c4e7393c3f..69e9a2d1b0 100644
--- a/src/invert/laplace/impls/hypre3d/hypre_boundary.c
+++ b/src/invert/laplace/impls/hypre3d/hypre_boundary.c
@@ -10,8 +10,6 @@
  * returns info needed to adjust the right-hand-side and solution vector through
  * the functions AdjustRightHandSideEquations and AdjustSolutionEquations.
  *
- * Returned info arrays can be freed with the function AdjustEquationsFree().
- *
  * NOTE: It may make sense from an organizational standpoint to collect many of
  * these arguments in a structure of some sort.
  *
@@ -49,7 +47,7 @@
  *   the coefficient for b_ij.
  */
 
-HYPRE_Int
+void
 AdjustBCMatrixEquations(
    HYPRE_Int       nrows,
    HYPRE_Int      *ncols,
@@ -168,11 +166,9 @@ AdjustBCMatrixEquations(
    *na_ptr          = na;
    *aknum_array_ptr = aknum_array;
    *aki_array_ptr   = aki_array;
-
-   return 0;
 }
 
-HYPRE_Int
+void
 AdjustBCRightHandSideEquations(
    HYPRE_Complex  *rhs,
    HYPRE_Int       nb,
@@ -203,11 +199,9 @@ AdjustBCRightHandSideEquations(
    }
 
    *brhs_array_ptr = brhs_array;
-
-   return 0;
 }
 
-HYPRE_Int
+void
 AdjustBCSolutionEquations(
    HYPRE_Complex  *solution,
    HYPRE_Int       nb,
@@ -225,28 +219,5 @@ AdjustBCSolutionEquations(
       bjnum = bjnum_array[bnum];
       solution[binum] = (brhs_array[bnum] - bij_array[bnum] * solution[bjnum]) / bii_array[bnum];
    }
-
-   return 0;
-}
-
-HYPRE_Int
-AdjustBCEquationsFree(
-   HYPRE_Int     *binum_array,
-   HYPRE_Int     *bjnum_array,
-   HYPRE_Complex *bii_array,
-   HYPRE_Complex *bij_array,
-   HYPRE_Complex *brhs_array,
-   HYPRE_Int     *aknum_array,
-   HYPRE_Complex *aki_array)
-{
-   HypreFree(binum_array);
-   HypreFree(bjnum_array);
-   HypreFree(bii_array);
-   HypreFree(bij_array);
-   HypreFree(brhs_array);
-   HypreFree(aknum_array);
-   HypreFree(aki_array);
-
-   return 0;
 }
 

From 67660069a1bd2174bdc36a0750f8a9d79b0a88a9 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Wed, 5 Mar 2025 12:11:45 -0800
Subject: [PATCH 018/129] hypre_interface: Wrap BC arrays in structs &
 shared_ptr

Use structs to group together arrays for boundary row elimination.
Coefficients from HypreMatrix are stored in one struct, using a
shared_ptr to share values with vectors.

Eliminated boundary row values need to be passed from RHS to solution
vector. This now uses a shared pointer that will manage the HypreFree
call.
---
 include/bout/hypre_interface.hxx | 202 ++++++++++++++-----------------
 1 file changed, 93 insertions(+), 109 deletions(-)

diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index 0025ed062b..7ad50a008d 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -98,6 +98,82 @@ int checkHypreError(int error) {
 // TODO: set sizes
 // TODO: set contiguous blocks at once
 
+/// Wrapper around HYPRE_Complex, that calls HypreFree when destroyed.
+struct HypreComplexArray {
+  HYPRE_Complex *data;
+
+  ~HypreComplexArray() {
+    HypreFree(data);
+  }
+};
+
+/// Shared pointter to a HypreComplexArray. When the last copy is destroyed
+/// the HYPRE_Complex array inside will be free'd.
+using BCValuesPtr = std::shared_ptr<HypreComplexArray>;
+
+/// Contains information needed to eliminate boundary equations from
+/// RHS vectors, and restore boundary values in solution vectors.
+struct BCMatrixEquations {
+  HYPRE_Int      nb;
+  HYPRE_Int     *binum_array;
+  HYPRE_Int     *bjnum_array;
+  HYPRE_Complex *bii_array;
+  HYPRE_Complex *bij_array;
+  HYPRE_Int      na;
+  HYPRE_Int     *aknum_array;
+  HYPRE_Complex *aki_array;
+
+  BCMatrixEquations() = delete;
+
+  BCMatrixEquations(HYPRE_Int       nrows,
+                    HYPRE_Int      *ncols,
+                    HYPRE_BigInt   *rows,
+                    HYPRE_Int     **row_indexes_ptr,
+                    HYPRE_BigInt   *cols,
+                    HYPRE_Complex  *values,
+                    HYPRE_Int       nb,             // number of boundary equations
+                    HYPRE_Int      *bi_array)       // row i for each boundary equation
+    : nb(nb) {
+    AdjustBCMatrixEquations(nrows, ncols, rows, row_indexes_ptr, cols, values,
+                            nb, bi_array,
+                            // Outputs
+                            &binum_array, &bjnum_array, &bii_array, &bij_array,
+                            &na, &aknum_array, &aki_array);
+  }
+
+  ~BCMatrixEquations() {
+    // Free arrays
+    HypreFree(binum_array);
+    HypreFree(bjnum_array);
+    HypreFree(bii_array);
+    HypreFree(bij_array);
+    HypreFree(aknum_array);
+    HypreFree(aki_array);
+  }
+
+  /// Applies in-place modification of the rhs array.
+  ///
+  /// Returns an array of boundary values that can be used to apply
+  /// boundary conditions to a solution vector.
+  BCValuesPtr adjustBCRightHandSideEquations(HYPRE_Complex *rhs) {
+    BCValuesPtr brhs = std::make_shared<HypreComplexArray>();
+    AdjustBCRightHandSideEquations(rhs, nb, binum_array, bii_array, bij_array, &brhs->data,
+                                   na, aknum_array, aki_array);
+    return brhs;
+  }
+
+  /// Apply boundary conditions to the solution.
+  /// Uses the BCValuesPtr returned from adjustBCRightHandSideEquations()
+  void adjustBCSolutionEquations(BCValuesPtr brhs, HYPRE_Complex *solution) {
+    AdjustBCSolutionEquations(solution, nb,
+                              binum_array, bjnum_array, bii_array, bij_array, brhs->data);
+  }
+};
+
+/// A shared pointer to a BCMatrixEquations object
+using BCMatrixPtr = std::shared_ptr<BCMatrixEquations>;
+
+
 template <class T>
 class HypreVector {
   MPI_Comm comm;
@@ -126,9 +202,6 @@ public:
     checkHypreError(HYPRE_IJVectorDestroy(hypre_vector));
     HypreFree(I);
     HypreFree(V);
-    if (elimBErhs) {
-      HypreFree(brhs_array);
-    }
   }
 
   // Disable copy, at least for now: not clear that HYPRE_IJVector is
@@ -217,22 +290,14 @@ public:
     HypreMalloc(V, vsize * sizeof(HYPRE_Complex));
   }
 
-  // Data for eliminating boundary equations (TODO: convert this to a structure)
+  // Data for eliminating boundary equation
   bool elimBErhs = false;
   bool elimBEsol = false;
-  HYPRE_Complex *rhs;
-  HYPRE_Int      nb;
-  HYPRE_Int     *binum_array;
-  HYPRE_Int     *bjnum_array;
-  HYPRE_Complex *bii_array;
-  HYPRE_Complex *bij_array;
-  HYPRE_Complex *brhs_array; // This is not created from the HypreMatrix class
-  HYPRE_Int      na;
-  HYPRE_Int     *aknum_array;
-  HYPRE_Complex *aki_array;
+  BCMatrixPtr bcmatrix;
+  BCValuesPtr bcvalues;  /// Stores rhs values of BC rows
 
   void syncElimBErhs(HypreVector<T>& rhs) {
-    brhs_array = rhs.brhs_array;
+    bcvalues = rhs.bcvalues;
   }
 
   void assemble() {
@@ -245,8 +310,7 @@ public:
 
   void writeCacheToHypre() {
     if (elimBErhs) {
-      AdjustBCRightHandSideEquations(V, nb, binum_array, bii_array, bij_array, &brhs_array,
-                                     na, aknum_array, aki_array);
+      bcvalues = bcmatrix->adjustBCRightHandSideEquations(V);
     }
     checkHypreError(HYPRE_IJVectorSetValues(hypre_vector, vsize, I, V));
   }
@@ -254,7 +318,7 @@ public:
   void readCacheFromHypre() {
     checkHypreError(HYPRE_IJVectorGetValues(hypre_vector, vsize, I, V));
     if (elimBEsol) {
-      AdjustBCSolutionEquations(V, nb, binum_array, bjnum_array, bii_array, bij_array, brhs_array);
+      bcmatrix->adjustBCSolutionEquations(bcvalues, V);
     }
   }
 
@@ -410,19 +474,6 @@ public:
   using ind_type = typename T::ind_type;
 
   HypreMatrix() = default;
-//  The 'if' block below needs to be called when the HypreMatrix is destroyed,
-//  but I don't know where to put it.  The HypreMatrix class is handled
-//  differently from HypreVector.
-//  ~HypreVector() {
-//    if (elimBE) {
-//      HypreFree(binum_array);
-//      HypreFree(bjnum_array);
-//      HypreFree(bii_array);
-//      HypreFree(bij_array);
-//      HypreFree(aknum_array);
-//      HypreFree(aki_array);
-//    }
-//  }
   HypreMatrix(const HypreMatrix<T>&) = delete;
   HypreMatrix(HypreMatrix<T>&& other)
       : comm(other.comm), ilower(other.ilower), iupper(other.iupper),
@@ -748,16 +799,9 @@ public:
     return Element(*this, global_row, global_column, positions, weights);
   }
 
-  // Data for eliminating boundary equations (TODO: convert this to a structure)
+  // Data for eliminating boundary equations
   bool elimBE = false;
-  HYPRE_Int      nb;
-  HYPRE_Int     *binum_array;
-  HYPRE_Int     *bjnum_array;
-  HYPRE_Complex *bii_array;
-  HYPRE_Complex *bij_array;
-  HYPRE_Int      na;
-  HYPRE_Int     *aknum_array;
-  HYPRE_Complex *aki_array;
+  BCMatrixPtr bcmatrix; // Shared pointer
 
   void setElimBE() {
     elimBE = true;
@@ -765,24 +809,10 @@ public:
 
   void setElimBEVectors(HypreVector<T>& sol, HypreVector<T>& rhs) {
     sol.elimBEsol = elimBE;
-    sol.nb          = nb;
-    sol.binum_array = binum_array;
-    sol.bjnum_array = bjnum_array;
-    sol.bii_array   = bii_array;
-    sol.bij_array   = bij_array;
-    sol.na          = na;
-    sol.aknum_array = aknum_array;
-    sol.aki_array   = aki_array;
+    sol.bcmatrix = bcmatrix;
 
     rhs.elimBErhs = elimBE;
-    rhs.nb          = nb;
-    rhs.binum_array = binum_array;
-    rhs.bjnum_array = bjnum_array;
-    rhs.bii_array   = bii_array;
-    rhs.bij_array   = bij_array;
-    rhs.na          = na;
-    rhs.aknum_array = aknum_array;
-    rhs.aki_array   = aki_array;
+    rhs.bcmatrix = bcmatrix;
   }
 
   void assemble() {
@@ -819,7 +849,7 @@ public:
       HYPRE_Int *bi_array;
       HYPRE_Int *row_indexes;
       // There must be an easier way to get nb
-      nb = 0;
+      int nb = 0;
       BOUT_FOR_SERIAL(i, index_converter->getRegionBndry()) {
          nb++;
       }
@@ -829,59 +859,13 @@ public:
          bi_array[nb] = index_converter->getGlobal(i);
          nb++;
       }
-      AdjustBCMatrixEquations(num_rows, num_cols, rawI, &row_indexes, cols, vals,
-                              nb, bi_array,
-                              &binum_array, &bjnum_array, &bii_array, &bij_array,
-                              &na, &aknum_array, &aki_array);
+
+      bcmatrix = std::make_shared<BCMatrixEquations>(num_rows, num_cols,
+                                                     rawI, &row_indexes,
+                                                     cols, vals,
+                                                     nb, bi_array);
       HypreFree(bi_array);
-//    {
-//       FILE  *file;
-//       int    i;
-//       file = fopen("zbout.setvalues.out2", "w");
-//       fprintf(file, "nrows %d\n", num_rows);
-//       for (i = 0; i < num_rows; i++)
-//       {
-//          fprintf(file, "ncols %d: %d\n", i, num_cols[i]);
-//       }
-//       for (i = 0; i < num_rows; i++)
-//       {
-//          fprintf(file, "rows %d: %d\n", i, rawI[i]);
-//       }
-//       for (i = 0; i < num_entries; i++)
-//       {
-//          fprintf(file, "cols %d: %d\n", i, cols[i]);
-//       }
-//       for (i = 0; i < num_entries; i++)
-//       {
-//          fprintf(file, "vals %d: %f\n", i, vals[i]);
-//       }
-//       fclose(file);
-//
-//       file = fopen("zbout.setvalues.out3", "w");
-//       for (i = 0; i < num_rows; i++)
-//       {
-//          fprintf(file, "row_indexes %d: %d\n", i, row_indexes[i]);
-//       }
-//       fprintf(file, "nb %d\n", nb);
-//       for (i = 0; i < nb; i++)
-//       {
-//          fprintf(file, "bijnum_array %d: %d %d\n", i, binum_array[i], bjnum_array[i]);
-//       }
-//       for (i = 0; i < nb; i++)
-//       {
-//          fprintf(file, "biiij_array %d: %f %f\n", i, bii_array[i], bij_array[i]);
-//       }
-//       fprintf(file, "na %d\n", na);
-//       for (i = 0; i < na; i++)
-//       {
-//          fprintf(file, "aknum_array %d: %d\n", i, aknum_array[i]);
-//       }
-//       for (i = 0; i < na; i++)
-//       {
-//          fprintf(file, "bki_array %d: %f\n", i, aki_array[i]);
-//       }
-//       fclose(file);
-//    }
+
       checkHypreError(
         HYPRE_IJMatrixSetValues2(*hypre_matrix, num_rows, num_cols, rawI, row_indexes, cols, vals));
       HypreFree(row_indexes);

From 29b65c592a229b122da3660fe98a40a23d1f3ed5 Mon Sep 17 00:00:00 2001
From: Rob Falgout <rfalgout@llnl.gov>
Date: Wed, 5 Mar 2025 12:40:04 -0800
Subject: [PATCH 019/129] Fixed a bug in rhs update for boundary elimination
 code

---
 include/bout/hypre_interface.hxx                  | 3 +--
 src/invert/laplace/impls/hypre3d/hypre_boundary.c | 3 +--
 2 files changed, 2 insertions(+), 4 deletions(-)

diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index 7ad50a008d..c8377f7f5a 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -44,7 +44,6 @@ AdjustBCRightHandSideEquations(
    HYPRE_Int       nb,
    HYPRE_Int      *binum_array,
    HYPRE_Complex  *bii_array,
-   HYPRE_Complex  *bij_array,
    HYPRE_Complex **brhs_array_ptr,
    HYPRE_Int       na,
    HYPRE_Int      *aknum_array,
@@ -157,7 +156,7 @@ struct BCMatrixEquations {
   /// boundary conditions to a solution vector.
   BCValuesPtr adjustBCRightHandSideEquations(HYPRE_Complex *rhs) {
     BCValuesPtr brhs = std::make_shared<HypreComplexArray>();
-    AdjustBCRightHandSideEquations(rhs, nb, binum_array, bii_array, bij_array, &brhs->data,
+    AdjustBCRightHandSideEquations(rhs, nb, binum_array, bii_array, &brhs->data,
                                    na, aknum_array, aki_array);
     return brhs;
   }
diff --git a/src/invert/laplace/impls/hypre3d/hypre_boundary.c b/src/invert/laplace/impls/hypre3d/hypre_boundary.c
index 69e9a2d1b0..30f0968765 100644
--- a/src/invert/laplace/impls/hypre3d/hypre_boundary.c
+++ b/src/invert/laplace/impls/hypre3d/hypre_boundary.c
@@ -174,7 +174,6 @@ AdjustBCRightHandSideEquations(
    HYPRE_Int       nb,
    HYPRE_Int      *binum_array,
    HYPRE_Complex  *bii_array,
-   HYPRE_Complex  *bij_array,
    HYPRE_Complex **brhs_array_ptr,
    HYPRE_Int       na,
    HYPRE_Int      *aknum_array,
@@ -195,7 +194,7 @@ AdjustBCRightHandSideEquations(
    {
       bnum  = anum;   // Assume only one interior equation per boundary equation
       aknum = aknum_array[anum];
-      rhs[aknum] -= aki_array[anum] * bij_array[bnum] / bii_array[bnum];
+      rhs[aknum] -= aki_array[anum] * brhs_array[bnum] / bii_array[bnum];
    }
 
    *brhs_array_ptr = brhs_array;

From 62b923b0a40ebdd80b3a25ab0da4ebb76889c72a Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Wed, 5 Mar 2025 14:50:31 -0800
Subject: [PATCH 020/129] FCITransform: Save R and Z coordinates to output

Reads cell center coordinates from the mesh, and saves them to the output.
This is to facilitate code coupling and visualisation.
---
 src/mesh/parallel/fci.cxx |  6 ++++++
 src/mesh/parallel/fci.hxx | 13 ++++++++++++-
 2 files changed, 18 insertions(+), 1 deletion(-)

diff --git a/src/mesh/parallel/fci.cxx b/src/mesh/parallel/fci.cxx
index acd4954f97..659df8600d 100644
--- a/src/mesh/parallel/fci.cxx
+++ b/src/mesh/parallel/fci.cxx
@@ -346,3 +346,9 @@ void FCITransform::integrateParallelSlices(Field3D& f) {
     f.ynext(map.offset) = map.integrate(f);
   }
 }
+
+void FCITransform::outputVars(Options& output_options) {
+  // Real-space coordinates of grid points
+  output_options["R"].force(R, "FCI");
+  output_options["Z"].force(Z, "FCI");
+}
diff --git a/src/mesh/parallel/fci.hxx b/src/mesh/parallel/fci.hxx
index 3ec3321a6a..1a02f558e1 100644
--- a/src/mesh/parallel/fci.hxx
+++ b/src/mesh/parallel/fci.hxx
@@ -73,11 +73,15 @@ public:
   FCITransform() = delete;
   FCITransform(Mesh& mesh, const Coordinates::FieldMetric& dy, bool zperiodic = true,
                Options* opt = nullptr)
-      : ParallelTransform(mesh, opt) {
+    : ParallelTransform(mesh, opt), R{&mesh}, Z{&mesh} {
 
     // check the coordinate system used for the grid data source
     FCITransform::checkInputGrid();
 
+    // Real-space coordinates of grid cells
+    mesh.get(R, "R", 0.0, false);
+    mesh.get(Z, "Z", 0.0, false);
+
     auto forward_boundary_xin =
         std::make_shared<BoundaryRegionPar>("FCI_forward", BNDRY_PAR_FWD_XIN, +1, &mesh);
     auto backward_boundary_xin = std::make_shared<BoundaryRegionPar>(
@@ -142,6 +146,10 @@ public:
 
   bool canToFromFieldAligned() const override { return false; }
 
+  /// Save mesh variables to output
+  /// If R and Z(x,y,z) coordinates are in the input then these are saved to output.
+  void outputVars(Options& output_options) override;
+
   bool requiresTwistShift(bool UNUSED(twist_shift_enabled),
                           [[maybe_unused]] YDirectionType ytype) override {
     // No Field3Ds require twist-shift, because they cannot be field-aligned
@@ -156,6 +164,9 @@ protected:
 private:
   /// FCI maps for each of the parallel slices
   std::vector<FCIMap> field_line_maps;
+
+  /// Real-space coordinates of grid points
+  Field3D R, Z;
 };
 
 #endif // BOUT_FCITRANSFORM_H

From 91ddbfd2af7cf85b442c70b1df250d0f282a9c0c Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Wed, 5 Mar 2025 14:52:03 -0800
Subject: [PATCH 021/129] Mesh, BoutMesh, Coordinates: update header comment

Update copyright statement, contact email.
---
 include/bout/coordinates.hxx     |  4 ++--
 include/bout/mesh.hxx            |  4 ++--
 src/mesh/impls/bout/boutmesh.cxx | 13 ++-----------
 3 files changed, 6 insertions(+), 15 deletions(-)

diff --git a/include/bout/coordinates.hxx b/include/bout/coordinates.hxx
index fb2fade75d..908c052e73 100644
--- a/include/bout/coordinates.hxx
+++ b/include/bout/coordinates.hxx
@@ -9,9 +9,9 @@
  *
  * 
  **************************************************************************
- * Copyright 2014 B.D.Dudson
+ * Copyright 2014-2025 BOUT++ contributors
  *
- * Contact: Ben Dudson, bd512@york.ac.uk
+ * Contact: Ben Dudson, dudson2@llnl.gov
  * 
  * This file is part of BOUT++.
  *
diff --git a/include/bout/mesh.hxx b/include/bout/mesh.hxx
index a1c88a2634..fc65dd8e0c 100644
--- a/include/bout/mesh.hxx
+++ b/include/bout/mesh.hxx
@@ -17,9 +17,9 @@
  *     * Incorporates code from topology.cpp and Communicator
  *
  **************************************************************************
- * Copyright 2010 B.D.Dudson, S.Farley, M.V.Umansky, X.Q.Xu
+ * Copyright 2010-2025 BOUT++ contributors
  *
- * Contact: Ben Dudson, bd512@york.ac.uk
+ * Contact: Ben Dudson, dudson2@llnl.gov
  * 
  * This file is part of BOUT++.
  *
diff --git a/src/mesh/impls/bout/boutmesh.cxx b/src/mesh/impls/bout/boutmesh.cxx
index 31319b87d1..9214c56855 100644
--- a/src/mesh/impls/bout/boutmesh.cxx
+++ b/src/mesh/impls/bout/boutmesh.cxx
@@ -2,19 +2,10 @@
  * Implementation of the Mesh class, handling input files compatible with
  * BOUT / BOUT-06.
  *
- * Changelog
- * ---------
- *
- * 2015-01 Ben Dudson <benjamin.dudson@york.ac.uk>
- *      *
- *
- * 2010-05 Ben Dudson <bd512@york.ac.uk>
- *      * Initial version, adapted from grid.cpp and topology.cpp
- *
  **************************************************************************
- * Copyright 2010 B.D.Dudson, S.Farley, M.V.Umansky, X.Q.Xu
+ * Copyright 2010-2025 BOUT++ contributors
  *
- * Contact: Ben Dudson, bd512@york.ac.uk
+ * Contact: Ben Dudson, dudson2@llnl.gov
  *
  * This file is part of BOUT++.
  *

From 33d78feb1b3a764e08be6156ff7894d6430c9b1b Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Wed, 5 Mar 2025 16:05:32 -0800
Subject: [PATCH 022/129] Apply suggestions from code review

Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
---
 examples/elm-pb/elm_pb.cxx | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/examples/elm-pb/elm_pb.cxx b/examples/elm-pb/elm_pb.cxx
index b36bd728d4..1a2608e62c 100644
--- a/examples/elm-pb/elm_pb.cxx
+++ b/examples/elm-pb/elm_pb.cxx
@@ -1364,7 +1364,7 @@ class ELMpb : public PhysicsModel {
           // Only update if simulation time has advanced
           // Uses an exponential decay of the weighting of the value in the boundary
           // so that the solution is well behaved for arbitrary steps
-          BoutReal weight = exp(-(t - phi_boundary_last_update) / phi_boundary_timescale);
+          BoutReal const weight = exp(-(t - phi_boundary_last_update) / phi_boundary_timescale);
           phi_boundary_last_update = t;
 
           if (mesh->firstX()) {
@@ -1378,7 +1378,7 @@ class ELMpb : public PhysicsModel {
                 }
               }
               MPI_Comm comm_inner = mesh->getYcomm(0);
-              int np;
+              int np = 0;
               MPI_Comm_size(comm_inner, &np);
               MPI_Allreduce(&philocal, &phivalue, 1, MPI_DOUBLE, MPI_SUM, comm_inner);
               phivalue /= (np * mesh->LocalNz * mesh->LocalNy);
@@ -1393,11 +1393,11 @@ class ELMpb : public PhysicsModel {
               }
 
               // Old value of phi at boundary. Note: this is constant in Z
-              BoutReal oldvalue =
+              BoutReal const oldvalue =
                   0.5 * (phi(mesh->xstart - 1, j, 0) + phi(mesh->xstart, j, 0));
 
               // New value of phi at boundary, relaxing towards phivalue
-              BoutReal newvalue = weight * oldvalue + (1. - weight) * phivalue;
+              BoutReal const newvalue = weight * oldvalue + (1. - weight) * phivalue;
 
               // Set phi at the boundary to this value
               for (int k = 0; k < mesh->LocalNz; k++) {
@@ -1420,7 +1420,7 @@ class ELMpb : public PhysicsModel {
                   0.5 * (phi(mesh->xend + 1, j, 0) + phi(mesh->xend, j, 0));
 
               // New value of phi at boundary, relaxing towards phivalue
-              BoutReal newvalue = weight * oldvalue + (1. - weight) * phivalue;
+              BoutReal const newvalue = weight * oldvalue + (1. - weight) * phivalue;
 
               // Set phi at the boundary to this value
               for (int k = 0; k < mesh->LocalNz; k++) {

From 08b1261f86e38eb45864265a4d48ec644545256b Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Thu, 6 Mar 2025 09:43:05 -0800
Subject: [PATCH 023/129] hypre_interface: Moved BC elimination to
 src/sys/hypre_interface.cxx

Changed C free functions to be members of BCMatrixEquations.
Clang formatted, minor style changes. Test results unchanged.
---
 CMakeLists.txt                                |   1 +
 include/bout/hypre_interface.hxx              | 187 +++++++--------
 .../laplace/impls/hypre3d/hypre3d_laplace.cxx |   1 -
 .../laplace/impls/hypre3d/hypre_boundary.c    | 222 ------------------
 src/sys/hypre_interface.cxx                   | 131 +++++++++++
 5 files changed, 215 insertions(+), 327 deletions(-)
 delete mode 100644 src/invert/laplace/impls/hypre3d/hypre_boundary.c
 create mode 100644 src/sys/hypre_interface.cxx

diff --git a/CMakeLists.txt b/CMakeLists.txt
index c45fca3b72..af628a7db5 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -335,6 +335,7 @@ set(BOUT_SOURCES
   ./src/sys/generator_context.cxx
   ./include/bout/hyprelib.hxx
   ./src/sys/hyprelib.cxx
+  ./src/sys/hypre_interface.cxx
   ./src/sys/msg_stack.cxx
   ./src/sys/options.cxx
   ./src/sys/options/optionparser.hxx
diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index c8377f7f5a..33e6218c8f 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -20,45 +20,6 @@
 #include "HYPRE_utilities.h"
 #include "_hypre_utilities.h"
 
-void
-AdjustBCMatrixEquations(
-   HYPRE_Int       nrows,
-   HYPRE_Int      *ncols,
-   HYPRE_BigInt   *rows,
-   HYPRE_Int     **row_indexes_ptr,
-   HYPRE_BigInt   *cols,
-   HYPRE_Complex  *values,
-   HYPRE_Int       nb,              // number of boundary equations
-   HYPRE_Int      *bi_array,        // row i for each boundary equation
-   HYPRE_Int     **binum_array_ptr, // data index for row i (for each boundary equation)
-   HYPRE_Int     **bjnum_array_ptr, // data index for col j (for each boundary equation)
-   HYPRE_Complex **bii_array_ptr,   // coefficient b_ii (for each boundary equation)
-   HYPRE_Complex **bij_array_ptr,   // coefficient b_ij (for each boundary equation)
-   HYPRE_Int      *na_ptr,          // number of interior equations to adjust
-   HYPRE_Int     **aknum_array_ptr, // data index for row k (for each interior equation)
-   HYPRE_Complex **aki_array_ptr);  // coefficient a_ki (for each interior equation)
-
-void
-AdjustBCRightHandSideEquations(
-   HYPRE_Complex  *rhs,
-   HYPRE_Int       nb,
-   HYPRE_Int      *binum_array,
-   HYPRE_Complex  *bii_array,
-   HYPRE_Complex **brhs_array_ptr,
-   HYPRE_Int       na,
-   HYPRE_Int      *aknum_array,
-   HYPRE_Complex  *aki_array);
-
-void
-AdjustBCSolutionEquations(
-   HYPRE_Complex  *solution,
-   HYPRE_Int       nb,
-   HYPRE_Int      *binum_array,
-   HYPRE_Int      *bjnum_array,
-   HYPRE_Complex  *bii_array,
-   HYPRE_Complex  *bij_array,
-   HYPRE_Complex  *brhs_array);
-
 #include <memory>
 
 // BOUT_ENUM_CLASS does not work inside namespaces
@@ -99,46 +60,83 @@ int checkHypreError(int error) {
 
 /// Wrapper around HYPRE_Complex, that calls HypreFree when destroyed.
 struct HypreComplexArray {
-  HYPRE_Complex *data;
+  HYPRE_Complex* data;
 
-  ~HypreComplexArray() {
-    HypreFree(data);
-  }
+  HypreComplexArray(int n) { HypreMalloc(data, sizeof(HYPRE_Complex) * n); }
+
+  ~HypreComplexArray() { HypreFree(data); }
 };
 
 /// Shared pointter to a HypreComplexArray. When the last copy is destroyed
 /// the HYPRE_Complex array inside will be free'd.
 using BCValuesPtr = std::shared_ptr<HypreComplexArray>;
 
-/// Contains information needed to eliminate boundary equations from
-/// RHS vectors, and restore boundary values in solution vectors.
+/*!
+ * This function modifies the input for the HYPRE_IJMatrixSetValues() routine to
+ * eliminate the boundary condition equations (see below for details on how the
+ * equations are adjusted).  It modifies the arrays ncols, rows, cols, and
+ * values.  It also returns a row_indexes array.  This can then be passed to the
+ * HYPRE_IJMatrixSetValues2() routine to set up the matrix in hypre.
+ *
+ * The arguments nb and bi_array indicate the boundary equations.  The routine
+ * returns info needed to adjust the right-hand-side and solution vector through
+ * the functions AdjustRightHandSideEquations and AdjustSolutionEquations.
+ *
+ * NOTE: It may make sense from an organizational standpoint to collect many of
+ * these arguments in a structure of some sort.
+ *
+ * Notation, assumptions, and other details:
+ *
+ * - Boundary equation i is assumed to have two coefficients
+ *
+ *      b_ii * u_i + b_ij * u_j = rhs_i
+ *
+ * - We also assume that each boundary equation has only one interior equation k
+ *   coupled to it (such that k = j) with coupling coefficient a_ki
+ *
+ *      a_ki * u_i + a_kj * u_j + ... = rhs_k
+ *
+ * - Each equation k is adjusted as follows:
+ *
+ *      a_kj = a_kj - a_ki * b_ij / b_ii
+ *      a_ki = 0
+ *
+ * - Boundary equations are adjusted to be identity equations in the matrix, but
+ *   the boundary coefficients (b_ii, b_ij) are returned for use later
+ *
+ * - Right-hand-side equations are adjusted in AdjustRightHandSideEquations() as
+ *   follows: rhs_k = rhs_k - a_ki * rhs_i / b_ii
+ *
+ * - Solution unknowns are adjusted at boundaries in AdjustSolutionEquations as
+ *   follows: u_i = (rhs_i - b_ij * u_j) / b_ii
+ *
+ * - Naming conventions: Arrays starting with 'b' are boundary equation arrays
+ *   indexed by 'bnum', and arrays starting with 'a' are non-boundary arrays
+ *   (interior matrix equations) indexed by 'anum'.  When 'num' is prefixed with
+ *   a row or column number 'i', 'j', or 'k', the array holds the corresponding
+ *   local data index for that row or column (e.g., an index into the local
+ *   solution vector).  Matrix coefficients are named as above, e.g., 'bij' is
+ *   the coefficient for b_ij.
+ *
+ *   NOTE: Implementation in src/sys/hypre_interface.cxx
+ */
 struct BCMatrixEquations {
-  HYPRE_Int      nb;
-  HYPRE_Int     *binum_array;
-  HYPRE_Int     *bjnum_array;
-  HYPRE_Complex *bii_array;
-  HYPRE_Complex *bij_array;
-  HYPRE_Int      na;
-  HYPRE_Int     *aknum_array;
-  HYPRE_Complex *aki_array;
+  HYPRE_Int nb;
+  HYPRE_Int* binum_array;
+  HYPRE_Int* bjnum_array;
+  HYPRE_Complex* bii_array;
+  HYPRE_Complex* bij_array;
+  HYPRE_Int na;
+  HYPRE_Int* aknum_array;
+  HYPRE_Complex* aki_array;
 
   BCMatrixEquations() = delete;
 
-  BCMatrixEquations(HYPRE_Int       nrows,
-                    HYPRE_Int      *ncols,
-                    HYPRE_BigInt   *rows,
-                    HYPRE_Int     **row_indexes_ptr,
-                    HYPRE_BigInt   *cols,
-                    HYPRE_Complex  *values,
-                    HYPRE_Int       nb,             // number of boundary equations
-                    HYPRE_Int      *bi_array)       // row i for each boundary equation
-    : nb(nb) {
-    AdjustBCMatrixEquations(nrows, ncols, rows, row_indexes_ptr, cols, values,
-                            nb, bi_array,
-                            // Outputs
-                            &binum_array, &bjnum_array, &bii_array, &bij_array,
-                            &na, &aknum_array, &aki_array);
-  }
+  BCMatrixEquations(HYPRE_Int nrows, HYPRE_Int* ncols, HYPRE_BigInt* rows,
+                    HYPRE_Int** row_indexes_ptr, HYPRE_BigInt* cols,
+                    HYPRE_Complex* values,
+                    HYPRE_Int nb,         // number of boundary equations
+                    HYPRE_Int* bi_array); // row i for each boundary equation
 
   ~BCMatrixEquations() {
     // Free arrays
@@ -154,25 +152,16 @@ struct BCMatrixEquations {
   ///
   /// Returns an array of boundary values that can be used to apply
   /// boundary conditions to a solution vector.
-  BCValuesPtr adjustBCRightHandSideEquations(HYPRE_Complex *rhs) {
-    BCValuesPtr brhs = std::make_shared<HypreComplexArray>();
-    AdjustBCRightHandSideEquations(rhs, nb, binum_array, bii_array, &brhs->data,
-                                   na, aknum_array, aki_array);
-    return brhs;
-  }
+  BCValuesPtr adjustBCRightHandSideEquations(HYPRE_Complex* rhs);
 
   /// Apply boundary conditions to the solution.
   /// Uses the BCValuesPtr returned from adjustBCRightHandSideEquations()
-  void adjustBCSolutionEquations(BCValuesPtr brhs, HYPRE_Complex *solution) {
-    AdjustBCSolutionEquations(solution, nb,
-                              binum_array, bjnum_array, bii_array, bij_array, brhs->data);
-  }
+  void adjustBCSolutionEquations(BCValuesPtr brhs, HYPRE_Complex* solution);
 };
 
 /// A shared pointer to a BCMatrixEquations object
 using BCMatrixPtr = std::shared_ptr<BCMatrixEquations>;
 
-
 template <class T>
 class HypreVector {
   MPI_Comm comm;
@@ -293,11 +282,9 @@ public:
   bool elimBErhs = false;
   bool elimBEsol = false;
   BCMatrixPtr bcmatrix;
-  BCValuesPtr bcvalues;  /// Stores rhs values of BC rows
+  BCValuesPtr bcvalues; /// Stores rhs values of BC rows
 
-  void syncElimBErhs(HypreVector<T>& rhs) {
-    bcvalues = rhs.bcvalues;
-  }
+  void syncElimBErhs(HypreVector<T>& rhs) { bcvalues = rhs.bcvalues; }
 
   void assemble() {
     CALI_CXX_MARK_FUNCTION;
@@ -802,9 +789,7 @@ public:
   bool elimBE = false;
   BCMatrixPtr bcmatrix; // Shared pointer
 
-  void setElimBE() {
-    elimBE = true;
-  }
+  void setElimBE() { elimBE = true; }
 
   void setElimBEVectors(HypreVector<T>& sol, HypreVector<T>& rhs) {
     sol.elimBEsol = elimBE;
@@ -845,34 +830,28 @@ public:
 
     // Eliminate boundary condition equations in hypre SetValues input arguments
     if (elimBE) {
-      HYPRE_Int *bi_array;
-      HYPRE_Int *row_indexes;
+      HYPRE_Int* bi_array;
+      HYPRE_Int* row_indexes;
       // There must be an easier way to get nb
       int nb = 0;
-      BOUT_FOR_SERIAL(i, index_converter->getRegionBndry()) {
-         nb++;
-      }
+      BOUT_FOR_SERIAL(i, index_converter->getRegionBndry()) { nb++; }
       HypreMalloc(bi_array, nb * sizeof(HYPRE_Int));
       nb = 0;
       BOUT_FOR_SERIAL(i, index_converter->getRegionBndry()) {
-         bi_array[nb] = index_converter->getGlobal(i);
-         nb++;
+        bi_array[nb] = index_converter->getGlobal(i);
+        nb++;
       }
 
-      bcmatrix = std::make_shared<BCMatrixEquations>(num_rows, num_cols,
-                                                     rawI, &row_indexes,
-                                                     cols, vals,
-                                                     nb, bi_array);
+      bcmatrix = std::make_shared<BCMatrixEquations>(
+          num_rows, num_cols, rawI, &row_indexes, cols, vals, nb, bi_array);
       HypreFree(bi_array);
 
-      checkHypreError(
-        HYPRE_IJMatrixSetValues2(*hypre_matrix, num_rows, num_cols, rawI, row_indexes, cols, vals));
+      checkHypreError(HYPRE_IJMatrixSetValues2(*hypre_matrix, num_rows, num_cols, rawI,
+                                               row_indexes, cols, vals));
       HypreFree(row_indexes);
-    }
-    else
-    {
+    } else {
       checkHypreError(
-        HYPRE_IJMatrixSetValues(*hypre_matrix, num_rows, num_cols, rawI, cols, vals));
+          HYPRE_IJMatrixSetValues(*hypre_matrix, num_rows, num_cols, rawI, cols, vals));
     }
     checkHypreError(HYPRE_IJMatrixAssemble(*hypre_matrix));
     checkHypreError(HYPRE_IJMatrixGetObject(*hypre_matrix,
@@ -1055,7 +1034,7 @@ public:
 
     switch (solver_type) {
     case HYPRE_SOLVER_TYPE::gmres: {
-       HYPRE_ParCSRGMRESSetKDim(solver, 30);  // TODO: Make this an input file parameter
+      HYPRE_ParCSRGMRESSetKDim(solver, 30); // TODO: Make this an input file parameter
       break;
     }
     case HYPRE_SOLVER_TYPE::bicgstab: {
diff --git a/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx b/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx
index def54b36b5..beb83a216d 100644
--- a/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx
+++ b/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx
@@ -28,7 +28,6 @@
 #if BOUT_HAS_HYPRE
 
 #include "hypre3d_laplace.hxx"
-#include "hypre_boundary.c"
 
 #include <bout/assert.hxx>
 #include <bout/boutcomm.hxx>
diff --git a/src/invert/laplace/impls/hypre3d/hypre_boundary.c b/src/invert/laplace/impls/hypre3d/hypre_boundary.c
deleted file mode 100644
index 30f0968765..0000000000
--- a/src/invert/laplace/impls/hypre3d/hypre_boundary.c
+++ /dev/null
@@ -1,222 +0,0 @@
-
-/*
- * This function modifies the input for the HYPRE_IJMatrixSetValues() routine to
- * eliminate the boundary condition equations (see below for details on how the
- * equations are adjusted).  It modifies the arrays ncols, rows, cols, and
- * values.  It also returns a row_indexes array.  This can then be passed to the
- * HYPRE_IJMatrixSetValues2() routine to set up the matrix in hypre.
- *
- * The arguments nb and bi_array indicate the boundary equations.  The routine
- * returns info needed to adjust the right-hand-side and solution vector through
- * the functions AdjustRightHandSideEquations and AdjustSolutionEquations.
- *
- * NOTE: It may make sense from an organizational standpoint to collect many of
- * these arguments in a structure of some sort.
- *
- * Notation, assumptions, and other details:
- *
- * - Boundary equation i is assumed to have two coefficients
- *
- *      b_ii * u_i + b_ij * u_j = rhs_i
- *
- * - We also assume that each boundary equation has only one interior equation k
- *   coupled to it (such that k = j) with coupling coefficient a_ki
- *
- *      a_ki * u_i + a_kj * u_j + ... = rhs_k
- *
- * - Each equation k is adjusted as follows:
- *
- *      a_kj = a_kj - a_ki * b_ij / b_ii
- *      a_ki = 0
- *
- * - Boundary equations are adjusted to be identity equations in the matrix, but
- *   the boundary coefficients (b_ii, b_ij) are returned for use later
- *
- * - Right-hand-side equations are adjusted in AdjustRightHandSideEquations() as
- *   follows: rhs_k = rhs_k - a_ki * rhs_i / b_ii
- *
- * - Solution unknowns are adjusted at boundaries in AdjustSolutionEquations as
- *   follows: u_i = (rhs_i - b_ij * u_j) / b_ii
- *
- * - Naming conventions: Arrays starting with 'b' are boundary equation arrays
- *   indexed by 'bnum', and arrays starting with 'a' are non-boundary arrays
- *   (interior matrix equations) indexed by 'anum'.  When 'num' is prefixed with
- *   a row or column number 'i', 'j', or 'k', the array holds the corresponding
- *   local data index for that row or column (e.g., an index into the local
- *   solution vector).  Matrix coefficients are named as above, e.g., 'bij' is
- *   the coefficient for b_ij.
- */
-
-void
-AdjustBCMatrixEquations(
-   HYPRE_Int       nrows,
-   HYPRE_Int      *ncols,
-   HYPRE_BigInt   *rows,
-   HYPRE_Int     **row_indexes_ptr,
-   HYPRE_BigInt   *cols,
-   HYPRE_Complex  *values,
-   HYPRE_Int       nb,              // number of boundary equations
-   HYPRE_Int      *bi_array,        // row i for each boundary equation
-   HYPRE_Int     **binum_array_ptr, // data index for row i (for each boundary equation)
-   HYPRE_Int     **bjnum_array_ptr, // data index for col j (for each boundary equation)
-   HYPRE_Complex **bii_array_ptr,   // coefficient b_ii (for each boundary equation)
-   HYPRE_Complex **bij_array_ptr,   // coefficient b_ij (for each boundary equation)
-   HYPRE_Int      *na_ptr,          // number of interior equations to adjust
-   HYPRE_Int     **aknum_array_ptr, // data index for row k (for each interior equation)
-   HYPRE_Complex **aki_array_ptr)   // coefficient a_ki (for each interior equation)
-{
-   HYPRE_Int     *row_indexes;
-   HYPRE_Int      na, *binum_array, *bjnum_array, *aknum_array;
-   HYPRE_Complex *bii_array, *bij_array, *aki_array;
-   HYPRE_Int      i, j, k, m, mkj, anum, bnum, acoeffnum, bcoeffnum;
-   HYPRE_Int      binum, aknum;
-   HYPRE_Complex  bii, bij, aki;
-
-   /* Create the row_indexes array */
-   row_indexes = (HYPRE_Int *)malloc(sizeof(HYPRE_Int) * nrows);
-   row_indexes[0] = 0;
-   for (i = 1; i < nrows; i++)
-   {
-      row_indexes[i] = row_indexes[i-1] + ncols[i-1];
-   }
-
-   /* Assume just one interior equation coupled to each boundary equation */
-   na = nb;
-
-   /* Allocate return arrays */
-   HypreMalloc(binum_array, sizeof(HYPRE_Int) * nb);
-   HypreMalloc(bjnum_array, sizeof(HYPRE_Int) * nb);
-   HypreMalloc(bii_array,   sizeof(HYPRE_Complex) * nb);
-   HypreMalloc(bij_array,   sizeof(HYPRE_Complex) * nb);
-   HypreMalloc(aknum_array, sizeof(HYPRE_Int) * na);
-   HypreMalloc(aki_array,   sizeof(HYPRE_Complex) * na);
-
-   binum = 0;
-   aknum = 0;
-   for (bnum = 0; bnum < nb; bnum++)
-   {
-      /* Get boundary equation information and adjust boundary equations */
-      /* Find row i in rows array (assume i increases and rows is sorted) */
-      i = bi_array[bnum];
-      for (; binum < nrows; binum++)
-      {
-         if (i == rows[binum])
-         {
-            break;   // Found row i in rows array
-         }
-      }
-      bcoeffnum = row_indexes[binum];
-      for (m = 0; m < 2; m++)               // Assume only two boundary equation coefficients
-      {
-         if (cols[bcoeffnum + m] == i)
-         {
-            bii = values[bcoeffnum + m];
-            values[bcoeffnum + m] = -1.0;   // Identity equation (negative definite matrix)
-         }
-         else
-         {
-            j = cols[bcoeffnum + m];
-            bij = values[bcoeffnum + m];
-            values[bcoeffnum + m] = 0.0;   // Identity equation
-         }
-      }
-      ncols[binum] = 1;                  // Identity equation
-
-      /* Get interior equation information and adjust interior equations */
-      /* Find row k in rows array (assume k increases and rows is sorted) */
-      k = j;         // Assume equation k = j
-      for (; aknum < nrows; aknum++)
-      {
-         if (k == rows[aknum])
-         {
-            break;   // Found row k in rows array
-         }
-      }
-      acoeffnum = row_indexes[aknum];
-      for (m = 0; m < ncols[aknum]; m++)
-      {
-         if (cols[acoeffnum + m] == j)
-         {
-            mkj = m;                       // Save for update of akj value below
-         }
-         if (cols[acoeffnum + m] == i)
-         {
-            aki = values[acoeffnum + m];
-            values[acoeffnum + m] = 0.0;   // Eliminate coupling to boundary equation
-         }
-      }
-      values[acoeffnum + mkj] -= aki * bij / bii;   // Update akj value
-
-      /* Update return arrays */
-      anum = bnum;                // Assume only one interior equation k
-      binum_array[bnum] = binum;
-      bjnum_array[bnum] = aknum;  // Assume only one interior equation k
-      bii_array[bnum]   = bii;
-      bij_array[bnum]   = bij;
-      aknum_array[anum] = aknum;
-      aki_array[anum]   = aki;
-   }
-
-   /* Set return arguments */
-   *row_indexes_ptr = row_indexes;
-   *binum_array_ptr = binum_array;
-   *bjnum_array_ptr = bjnum_array;
-   *bii_array_ptr   = bii_array;
-   *bij_array_ptr   = bij_array;
-   *na_ptr          = na;
-   *aknum_array_ptr = aknum_array;
-   *aki_array_ptr   = aki_array;
-}
-
-void
-AdjustBCRightHandSideEquations(
-   HYPRE_Complex  *rhs,
-   HYPRE_Int       nb,
-   HYPRE_Int      *binum_array,
-   HYPRE_Complex  *bii_array,
-   HYPRE_Complex **brhs_array_ptr,
-   HYPRE_Int       na,
-   HYPRE_Int      *aknum_array,
-   HYPRE_Complex  *aki_array)
-{
-   HYPRE_Complex *brhs_array;
-   HYPRE_Int      anum, bnum, binum, aknum;
-
-   HypreMalloc(brhs_array, sizeof(HYPRE_Complex) * nb);
-
-   for (bnum = 0; bnum < nb; bnum++)
-   {
-      binum = binum_array[bnum];
-      brhs_array[bnum] = rhs[binum];
-   }
-
-   for (anum = 0; anum < na; anum++)
-   {
-      bnum  = anum;   // Assume only one interior equation per boundary equation
-      aknum = aknum_array[anum];
-      rhs[aknum] -= aki_array[anum] * brhs_array[bnum] / bii_array[bnum];
-   }
-
-   *brhs_array_ptr = brhs_array;
-}
-
-void
-AdjustBCSolutionEquations(
-   HYPRE_Complex  *solution,
-   HYPRE_Int       nb,
-   HYPRE_Int      *binum_array,
-   HYPRE_Int      *bjnum_array,
-   HYPRE_Complex  *bii_array,
-   HYPRE_Complex  *bij_array,
-   HYPRE_Complex  *brhs_array)
-{
-   HYPRE_Int  bnum, binum, bjnum;
-
-   for (bnum = 0; bnum < nb; bnum++)
-   {
-      binum = binum_array[bnum];
-      bjnum = bjnum_array[bnum];
-      solution[binum] = (brhs_array[bnum] - bij_array[bnum] * solution[bjnum]) / bii_array[bnum];
-   }
-}
-
diff --git a/src/sys/hypre_interface.cxx b/src/sys/hypre_interface.cxx
new file mode 100644
index 0000000000..1838bd5158
--- /dev/null
+++ b/src/sys/hypre_interface.cxx
@@ -0,0 +1,131 @@
+
+#include "bout/build_defines.hxx"
+
+#if BOUT_HAS_HYPRE
+
+#include "bout/hypre_interface.hxx"
+
+namespace bout {
+
+BCMatrixEquations::BCMatrixEquations(HYPRE_Int nrows, HYPRE_Int* ncols,
+                                     HYPRE_BigInt* rows, HYPRE_Int** row_indexes_ptr,
+                                     HYPRE_BigInt* cols, HYPRE_Complex* values,
+                                     HYPRE_Int nb, HYPRE_Int* bi_array)
+    : nb(nb) {
+  // Create the row_indexes array: row_indexes[i] is the offset of row i's first
+  // entry in cols/values. Allocated with HypreMalloc (not plain malloc) because
+  // the caller releases it with HypreFree; the loop writes nothing if nrows == 0.
+  HYPRE_Int* row_indexes = nullptr;
+  HypreMalloc(row_indexes, sizeof(HYPRE_Int) * nrows);
+  for (HYPRE_Int i = 0; i < nrows; i++) {
+    row_indexes[i] = (i == 0) ? 0 : row_indexes[i - 1] + ncols[i - 1];
+  }
+
+  // Assume just one interior equation coupled to each boundary equation
+  na = nb;
+
+  // Allocate the member arrays (row indices and saved coefficients)
+  HypreMalloc(binum_array, sizeof(HYPRE_Int) * nb);
+  HypreMalloc(bjnum_array, sizeof(HYPRE_Int) * nb);
+  HypreMalloc(bii_array, sizeof(HYPRE_Complex) * nb);
+  HypreMalloc(bij_array, sizeof(HYPRE_Complex) * nb);
+  HypreMalloc(aknum_array, sizeof(HYPRE_Int) * na);
+  HypreMalloc(aki_array, sizeof(HYPRE_Complex) * na);
+
+  HYPRE_Int binum = 0;
+  HYPRE_Int aknum = 0;
+  for (HYPRE_Int bnum = 0; bnum < nb; bnum++) {
+    // Get boundary equation information and adjust boundary equations
+    // Find row i in rows array (assume i increases and rows is sorted)
+    HYPRE_Int i = bi_array[bnum];
+    for (; binum < nrows; binum++) {
+      if (i == rows[binum]) {
+        break; // Found row i in rows array
+      }
+    }
+    HYPRE_Int bcoeffnum = row_indexes[binum];
+    HYPRE_Complex bii{0.0}, bij{0.0};
+    HYPRE_Int j = 0;
+
+    for (HYPRE_Int m = 0; m < 2; m++) { // Assume only two boundary equation coefficients
+      if (cols[bcoeffnum + m] == i) {
+        bii = values[bcoeffnum + m];
+        values[bcoeffnum + m] = -1.0; // Identity equation (negative definite matrix)
+      } else {
+        j = cols[bcoeffnum + m];
+        bij = values[bcoeffnum + m];
+        values[bcoeffnum + m] = 0.0; // Identity equation
+      }
+    }
+    ncols[binum] = 1; // Identity equation
+
+    // Get interior equation information and adjust interior equations
+    // Find row k in rows array (assume k increases and rows is sorted)
+    HYPRE_Int k = j; // Assume equation k = j
+    for (; aknum < nrows; aknum++) {
+      if (k == rows[aknum]) {
+        break; // Found row k in rows array
+      }
+    }
+    HYPRE_Int acoeffnum = row_indexes[aknum];
+
+    HYPRE_Int mkj = 0;
+    HYPRE_Complex aki{0.0};
+    for (HYPRE_Int m = 0; m < ncols[aknum]; m++) {
+      if (cols[acoeffnum + m] == j) {
+        mkj = m; // Save for update of akj value below
+      }
+      if (cols[acoeffnum + m] == i) {
+        aki = values[acoeffnum + m];
+        values[acoeffnum + m] = 0.0; // Eliminate coupling to boundary equation
+      }
+    }
+    values[acoeffnum + mkj] -= aki * bij / bii; // Update akj value
+
+    // Update arrays
+    HYPRE_Int anum = bnum; // Assume only one interior equation k
+    binum_array[bnum] = binum;
+    bjnum_array[bnum] = aknum; // Assume only one interior equation k
+    bii_array[bnum] = bii;
+    bij_array[bnum] = bij;
+    aknum_array[anum] = aknum;
+    aki_array[anum] = aki;
+  }
+
+  // Hand the row offsets back to the caller, which frees them with HypreFree
+  *row_indexes_ptr = row_indexes;
+}
+
+BCValuesPtr BCMatrixEquations::adjustBCRightHandSideEquations(HYPRE_Complex* rhs) {
+  // Modifies rhs in place and returns the original rhs values of the boundary rows.
+  // Allocate array to store boundary row values
+  BCValuesPtr brhs = std::make_shared<HypreComplexArray>(nb);
+
+  for (HYPRE_Int bnum = 0; bnum < nb; bnum++) {
+    HYPRE_Int binum = binum_array[bnum];
+    brhs->data[bnum] = rhs[binum]; // Save rhs_i before rhs is modified below
+  }
+  // Interior rows coupled to a boundary row: rhs_k = rhs_k - a_ki * rhs_i / b_ii
+  for (HYPRE_Int anum = 0; anum < na; anum++) {
+    HYPRE_Int bnum = anum; // Assume only one interior equation per boundary equation
+    HYPRE_Int aknum = aknum_array[anum];
+    rhs[aknum] -= aki_array[anum] * brhs->data[bnum] / bii_array[bnum];
+  }
+
+  return brhs;
+}
+
+void BCMatrixEquations::adjustBCSolutionEquations(BCValuesPtr brhs,
+                                                  HYPRE_Complex* solution) {
+  // Overwrite each boundary unknown in place: u_i = (rhs_i - b_ij * u_j) / b_ii
+  for (HYPRE_Int bnum = 0; bnum < nb; bnum++) {
+    HYPRE_Int binum = binum_array[bnum]; // Data index of boundary row i
+    HYPRE_Int bjnum = bjnum_array[bnum]; // Data index of the coupled row j
+    solution[binum] =
+        (brhs->data[bnum] - bij_array[bnum] * solution[bjnum]) / bii_array[bnum];
+  }
+}
+
+} // namespace bout
+
+#endif // BOUT_HAS_HYPRE

From eea57fc2c1a798a80eca0d7687fa8219ffe09f9a Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Thu, 6 Mar 2025 09:44:53 -0800
Subject: [PATCH 024/129] test-laplace-hypre3d: Suppress BOUT++ log outputs

It was difficult to see the test results amongst the log outputs.
The logs are now piped and saved to files.
---
 tests/integrated/test-laplace-hypre3d/runtest | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/tests/integrated/test-laplace-hypre3d/runtest b/tests/integrated/test-laplace-hypre3d/runtest
index b50c5993b7..f1f5950547 100755
--- a/tests/integrated/test-laplace-hypre3d/runtest
+++ b/tests/integrated/test-laplace-hypre3d/runtest
@@ -19,20 +19,24 @@ build_and_log("Laplace 3D with Hypre")
 
 success = True
 for directory, nproc in test_directories:
-    command = "test-laplace3d -d " + directory
+    command = "./test-laplace3d -d " + directory
     print("running on", nproc, "processors:", command)
-    launch_safe(command, nproc=nproc)
+    s, out = launch_safe(command, nproc=nproc, pipe=True)
+    # Save output to log file
+    with open("run.log." + directory, "w") as f:
+        f.write(out)
 
     error_max = collect("error_max", path=directory, info=False)
 
     if error_max > tolerance:
-        print(directory + " failed with maximum error {}".format(error_max))
+        print(" => " + directory + " failed with maximum error {}".format(error_max))
         success = False
     else:
-        print(directory + " passed with maximum error {}".format(error_max))
+        print(" => " + directory + " passed with maximum error {}".format(error_max))
 
 if success:
-    print("All passed")
+    print("=> All passed")
     exit(0)
 else:
+    print("=> Some tests failed")
     exit(1)

From ef9fbed3e68ff6ea45294e95cb174457cc5c939b Mon Sep 17 00:00:00 2001
From: bendudson <219233+bendudson@users.noreply.github.com>
Date: Thu, 6 Mar 2025 17:46:47 +0000
Subject: [PATCH 025/129] Apply black changes

---
 tests/integrated/test_suite | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/integrated/test_suite b/tests/integrated/test_suite
index 307a8d84b3..77ad7882c4 100755
--- a/tests/integrated/test_suite
+++ b/tests/integrated/test_suite
@@ -188,7 +188,7 @@ class Test(threading.Thread):
                 self.output += "\n(It is likely that a timeout occured)"
             else:
                 # ❌ Failed
-                print("\u274C", end="")  # No newline
+                print("\u274c", end="")  # No newline
             print(" %7.3f s" % (time.time() - self.local.start_time), flush=True)
 
     def _cost(self):

From af72bd8f83e4ba5770d1800dd25bede21f6f1724 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Thu, 6 Mar 2025 19:52:51 +0100
Subject: [PATCH 026/129] Do not fail if clang-format is formatting the code

Until now, the CI job failed whenever clang-format had to
reformat code, because the return code is only zero if
nothing needs to be done.
---
 .github/workflows/clang-format.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/clang-format.yml b/.github/workflows/clang-format.yml
index 87f1947802..a6508a2dcd 100644
--- a/.github/workflows/clang-format.yml
+++ b/.github/workflows/clang-format.yml
@@ -22,7 +22,7 @@ jobs:
 
       - name: Run clang-format
         id: format
-        run: git clang-format origin/${{ github.base_ref }}
+        run: git clang-format origin/${{ github.base_ref }} || :
 
       - name: Commit to the PR branch
         uses: stefanzweifel/git-auto-commit-action@v5

From aeb83c6c18cc5fd59e9149d3a507185ab87ad453 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Wed, 12 Mar 2025 09:16:05 +0100
Subject: [PATCH 027/129] CI: Avoid issues with special characters

---
 .github/workflows/clang-format.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/clang-format.yml b/.github/workflows/clang-format.yml
index a6508a2dcd..d99b370810 100644
--- a/.github/workflows/clang-format.yml
+++ b/.github/workflows/clang-format.yml
@@ -22,7 +22,7 @@ jobs:
 
       - name: Run clang-format
         id: format
-        run: git clang-format origin/${{ github.base_ref }} || :
+        run: 'git clang-format origin/${{ github.base_ref }} || :'
 
       - name: Commit to the PR branch
         uses: stefanzweifel/git-auto-commit-action@v5

From dfa31b2870962ff86c76679ec5a16f358a4186b1 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Wed, 12 Mar 2025 09:50:40 +0100
Subject: [PATCH 028/129] CI: run git-clang-format until there are no more
 changes

That might format more code at once, but should avoid
a CI loop.
---
 .github/workflows/clang-format.yml | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/.github/workflows/clang-format.yml b/.github/workflows/clang-format.yml
index d99b370810..5e25154300 100644
--- a/.github/workflows/clang-format.yml
+++ b/.github/workflows/clang-format.yml
@@ -22,7 +22,11 @@ jobs:
 
       - name: Run clang-format
         id: format
-        run: 'git clang-format origin/${{ github.base_ref }} || :'
+        run:
+          while ! git clang-format origin/${{ github.base_ref }}
+          do
+            true
+          done
 
       - name: Commit to the PR branch
         uses: stefanzweifel/git-auto-commit-action@v5

From e743eb06f5c38e2d8feefc9c652268bbc6b7480f Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Wed, 12 Mar 2025 11:06:31 +0100
Subject: [PATCH 029/129] CI: use one line

---
 .github/workflows/clang-format.yml | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/.github/workflows/clang-format.yml b/.github/workflows/clang-format.yml
index 5e25154300..3b8cf6ee50 100644
--- a/.github/workflows/clang-format.yml
+++ b/.github/workflows/clang-format.yml
@@ -23,10 +23,7 @@ jobs:
       - name: Run clang-format
         id: format
         run:
-          while ! git clang-format origin/${{ github.base_ref }}
-          do
-            true
-          done
+          while ! git clang-format origin/${{ github.base_ref }} ; do true ; done
 
       - name: Commit to the PR branch
         uses: stefanzweifel/git-auto-commit-action@v5

From 1cb5277a6d288cc2f2f89c1ca840ede7e11faf52 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Wed, 12 Mar 2025 11:16:07 +0100
Subject: [PATCH 030/129] CI: stage before we run git-clang-format again

---
 .github/workflows/clang-format.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/clang-format.yml b/.github/workflows/clang-format.yml
index 3b8cf6ee50..49dfb31e25 100644
--- a/.github/workflows/clang-format.yml
+++ b/.github/workflows/clang-format.yml
@@ -23,7 +23,7 @@ jobs:
       - name: Run clang-format
         id: format
         run:
-          while ! git clang-format origin/${{ github.base_ref }} ; do true ; done
+          while ! git clang-format origin/${{ github.base_ref }} ; do git add . ; done
 
       - name: Commit to the PR branch
         uses: stefanzweifel/git-auto-commit-action@v5

From 9d1b46908fab0c61950905eefa73ad735b4a4c27 Mon Sep 17 00:00:00 2001
From: Rob Falgout <rfalgout@llnl.gov>
Date: Wed, 19 Mar 2025 14:39:19 -0700
Subject: [PATCH 031/129] Turn off test for false convergence in hypre GMRES
 solver

---
 include/bout/hypre_interface.hxx | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index 33e6218c8f..1837d5e275 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -1034,7 +1034,8 @@ public:
 
     switch (solver_type) {
     case HYPRE_SOLVER_TYPE::gmres: {
-      HYPRE_ParCSRGMRESSetKDim(solver, 30); // TODO: Make this an input file parameter
+      HYPRE_ParCSRGMRESSetKDim(solver, 30);           // TODO: Make this an input file parameter
+      HYPRE_GMRESSetSkipRealResidualCheck(solver, 1); // TODO: Make this an input file parameter
       break;
     }
     case HYPRE_SOLVER_TYPE::bicgstab: {

From f969c011249b60b337817432c026b1bd312291cc Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Wed, 19 Mar 2025 14:43:14 -0700
Subject: [PATCH 032/129] hypre_interface: Add kdim and
 skip_real_residual_check options

These options control the GMRES solver.
---
 include/bout/hypre_interface.hxx | 12 ++++++++++--
 1 file changed, 10 insertions(+), 2 deletions(-)

diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index 1837d5e275..15ca97cb8a 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -1034,8 +1034,16 @@ public:
 
     switch (solver_type) {
     case HYPRE_SOLVER_TYPE::gmres: {
-      HYPRE_ParCSRGMRESSetKDim(solver, 30);           // TODO: Make this an input file parameter
-      HYPRE_GMRESSetSkipRealResidualCheck(solver, 1); // TODO: Make this an input file parameter
+      HYPRE_ParCSRGMRESSetKDim(solver,
+                               options["kdim"]
+                                 .doc("Set the maximum size of the Krylov space")
+                                 .withDefault(30));
+
+      if (options["skip_real_residual_check"]
+          .doc("Skip the evaluation and the check of the actual residual?")
+          .withDefault<bool>(false)) {
+        HYPRE_GMRESSetSkipRealResidualCheck(solver, 1);
+      }
       break;
     }
     case HYPRE_SOLVER_TYPE::bicgstab: {

From 3aed489c6cbb56137260860c63c4d32b9bd8029b Mon Sep 17 00:00:00 2001
From: Norbert Podhorszki <pnorbert@ornl.gov>
Date: Fri, 26 Apr 2024 09:41:34 -0400
Subject: [PATCH 033/129] Add attributes to ADIOS2 output to "define"
 dimensions as names. We need this for xarray support that is designed for the
 NetCDF model, where dimensions are separately defined entities.

---
 include/bout/adios_object.hxx     |  8 +++++++-
 src/sys/options/options_adios.cxx | 24 ++++++++++++++++++------
 2 files changed, 25 insertions(+), 7 deletions(-)

diff --git a/include/bout/adios_object.hxx b/include/bout/adios_object.hxx
index b14316f1ba..12da8ce4c7 100755
--- a/include/bout/adios_object.hxx
+++ b/include/bout/adios_object.hxx
@@ -57,11 +57,17 @@ public:
   }
 
   template <class T>
-  adios2::Variable<T> GetArrayVariable(const std::string& varname, adios2::Dims& shape) {
+  adios2::Variable<T> GetArrayVariable(const std::string& varname, adios2::Dims& shape,
+                                       const std::vector<std::string>& dimNames,
+                                       int rank) {
     adios2::Variable<T> v = io.InquireVariable<T>(varname);
     if (!v) {
       adios2::Dims start(shape.size());
       v = io.DefineVariable<T>(varname, shape, start, shape);
+      if (!rank && dimNames.size()) {
+        io.DefineAttribute<std::string>("__xarray_dimensions__", dimNames.data(),
+                                        dimNames.size(), varname, "/", true);
+      }
     } else {
       v.SetShape(shape);
     }
diff --git a/src/sys/options/options_adios.cxx b/src/sys/options/options_adios.cxx
index b3acbaada6..09797647ed 100644
--- a/src/sys/options/options_adios.cxx
+++ b/src/sys/options/options_adios.cxx
@@ -307,6 +307,12 @@ void OptionsADIOS::verifyTimesteps() const {
   return;
 }
 
+const std::vector<std::string> DIMS_NONE;
+const std::vector<std::string> DIMS_X = {"x"};
+const std::vector<std::string> DIMS_XY = {"x", "y"};
+const std::vector<std::string> DIMS_XZ = {"x", "z"};
+const std::vector<std::string> DIMS_XYZ = {"x", "y", "z"};
+
 /// Visit a variant type, and put the data into a NcVar
 struct ADIOSPutVarVisitor {
   ADIOSPutVarVisitor(const std::string& name, ADIOSStream& stream)
@@ -388,7 +394,8 @@ void ADIOSPutVarVisitor::operator()<Field2D>(const Field2D& value) {
   adios2::Dims memCount = {static_cast<size_t>(value.getNx()),
                            static_cast<size_t>(value.getNy())};
 
-  adios2::Variable<BoutReal> var = stream.GetArrayVariable<BoutReal>(varname, shape);
+  adios2::Variable<BoutReal> var =
+      stream.GetArrayVariable<BoutReal>(varname, shape, DIMS_XY, BoutComm::rank());
   var.SetSelection({start, count});
   var.SetMemorySelection({memStart, memCount});
   stream.engine.Put<BoutReal>(var, &value(0, 0));
@@ -425,7 +432,8 @@ void ADIOSPutVarVisitor::operator()<Field3D>(const Field3D& value) {
                            static_cast<size_t>(value.getNy()),
                            static_cast<size_t>(value.getNz())};
 
-  adios2::Variable<BoutReal> var = stream.GetArrayVariable<BoutReal>(varname, shape);
+  adios2::Variable<BoutReal> var =
+      stream.GetArrayVariable<BoutReal>(varname, shape, DIMS_XYZ, BoutComm::rank());
   var.SetSelection({start, count});
   var.SetMemorySelection({memStart, memCount});
   stream.engine.Put<BoutReal>(var, &value(0, 0, 0));
@@ -457,7 +465,8 @@ void ADIOSPutVarVisitor::operator()<FieldPerp>(const FieldPerp& value) {
   adios2::Dims memCount = {static_cast<size_t>(value.getNx()),
                            static_cast<size_t>(value.getNz())};
 
-  adios2::Variable<BoutReal> var = stream.GetArrayVariable<BoutReal>(varname, shape);
+  adios2::Variable<BoutReal> var =
+      stream.GetArrayVariable<BoutReal>(varname, shape, DIMS_XZ, BoutComm::rank());
   var.SetSelection({start, count});
   var.SetMemorySelection({memStart, memCount});
   stream.engine.Put<BoutReal>(var, &value(0, 0));
@@ -469,7 +478,8 @@ void ADIOSPutVarVisitor::operator()<Array<BoutReal>>(const Array<BoutReal>& valu
   adios2::Dims shape = {(size_t)BoutComm::size(), (size_t)value.size()};
   adios2::Dims start = {(size_t)BoutComm::rank(), 0};
   adios2::Dims count = {1, shape[1]};
-  adios2::Variable<BoutReal> var = stream.GetArrayVariable<BoutReal>(varname, shape);
+  adios2::Variable<BoutReal> var =
+      stream.GetArrayVariable<BoutReal>(varname, shape, DIMS_NONE, BoutComm::rank());
   var.SetSelection({start, count});
   stream.engine.Put<BoutReal>(var, value.begin());
 }
@@ -482,7 +492,8 @@ void ADIOSPutVarVisitor::operator()<Matrix<BoutReal>>(const Matrix<BoutReal>& va
                         (size_t)std::get<1>(s)};
   adios2::Dims start = {(size_t)BoutComm::rank(), 0, 0};
   adios2::Dims count = {1, shape[1], shape[2]};
-  adios2::Variable<BoutReal> var = stream.GetArrayVariable<BoutReal>(varname, shape);
+  adios2::Variable<BoutReal> var =
+      stream.GetArrayVariable<BoutReal>(varname, shape, DIMS_NONE, BoutComm::rank());
   var.SetSelection({start, count});
   stream.engine.Put<BoutReal>(var, value.begin());
 }
@@ -495,7 +506,8 @@ void ADIOSPutVarVisitor::operator()<Tensor<BoutReal>>(const Tensor<BoutReal>& va
                         (size_t)std::get<1>(s), (size_t)std::get<2>(s)};
   adios2::Dims start = {(size_t)BoutComm::rank(), 0, 0, 0};
   adios2::Dims count = {1, shape[1], shape[2], shape[3]};
-  adios2::Variable<BoutReal> var = stream.GetArrayVariable<BoutReal>(varname, shape);
+  adios2::Variable<BoutReal> var =
+      stream.GetArrayVariable<BoutReal>(varname, shape, DIMS_NONE, BoutComm::rank());
   var.SetSelection({start, count});
   stream.engine.Put<BoutReal>(var, value.begin());
 }

From d43cea2ee40a654898a4b4e4801aeb4934bb800d Mon Sep 17 00:00:00 2001
From: Seimon Powell <seimon.powell@ukaea.uk>
Date: Thu, 24 Apr 2025 14:54:20 +0100
Subject: [PATCH 034/129] Enable alternative stencil shapes in Jacobian
 colouring

4 new options added

solver:stencil:<option> = N, where <option> is one of cross, square, or taxi:
cross - all points with (|x| == 0 and |y| <= N) or (|x| <= N and |y| == 0)
square - all points with |x| <= N and |y| <= N
taxi - all points with |x| + |y| <= N
The options can be combined; the resulting stencil is the union of all requested stencils.
If none of them is set, the new default is solver:stencil:taxi = 2.
There is also an option to force the colouring matrix to be symmetric:
solver:force_symmetric_coloring=true
---
 src/solver/impls/snes/snes.cxx | 905 ++++++++++-----------------------
 1 file changed, 270 insertions(+), 635 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index e382bbd3f8..aec986511f 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1,4 +1,4 @@
-#include "bout/build_defines.hxx"
+#include "bout/build_config.hxx"
 
 #if BOUT_HAS_PETSC
 
@@ -9,15 +9,52 @@
 #include <bout/msg_stack.hxx>
 #include <bout/utils.hxx>
 
-#include <array>
 #include <cmath>
 #include <vector>
 
 #include <bout/output.hxx>
 
-#include "petscmat.h"
 #include "petscsnes.h"
 
+class ColoringStencil {
+private:
+  bool static in_compact(int const i, int const j, int const n_compact) {
+    return std::abs(i) <= n_compact && std::abs(j) <= n_compact;
+  }
+  bool static in_cross(int const i, int const j, int const n_cross) {
+    if (i == 0) {
+      return std::abs(j) <= n_cross;
+    }
+    if (j == 0) {
+      return std::abs(i) <= n_cross;
+    }
+    return false;
+  }
+  bool static in_taxi(int const i, int const j, int const n_taxi) {
+    return std::abs(i) + std::abs(j) <= n_taxi;
+  }
+
+public:
+  auto static get_offsets(int n_compact, int n_taxi, int n_cross) {
+    ASSERT2(n_compact >= 0 && n_cross >= 0 && n_taxi >= 0
+            && n_compact + n_cross + n_taxi > 0);
+    auto inside = [&](int i, int j) {
+      return in_compact(i, j, n_compact) || in_taxi(i, j, n_taxi)
+             || in_cross(i, j, n_cross);
+    };
+    std::vector<std::pair<int, int>> xyoffset;
+    auto loop_bound = std::max({n_compact, n_taxi, n_cross});
+    for (int i = -loop_bound; i <= loop_bound; ++i) {
+      for (int j = -loop_bound; j <= loop_bound; ++j) {
+        if (inside(i, j)) {
+          xyoffset.emplace_back(i, j);
+        }
+      }
+    }
+    return xyoffset;
+  }
+};
+
 /*
  * PETSc callback function, which evaluates the nonlinear
  * function to be solved by SNES.
@@ -120,31 +157,12 @@ SNESSolver::SNESSolver(Options* opts)
       matrix_free((*options)["matrix_free"]
                       .doc("Use matrix free Jacobian?")
                       .withDefault<bool>(false)),
-      matrix_free_operator((*options)["matrix_free_operator"]
-                               .doc("Use matrix free Jacobian-vector operator?")
-                               .withDefault<bool>(true)),
       lag_jacobian((*options)["lag_jacobian"]
                        .doc("Re-use the Jacobian this number of SNES iterations")
                        .withDefault(50)),
       use_coloring((*options)["use_coloring"]
                        .doc("Use matrix coloring to calculate Jacobian?")
-                       .withDefault<bool>(true)),
-      jacobian_recalculated(false),
-      prune_jacobian((*options)["prune_jacobian"]
-                         .doc("Remove small elements in the Jacobian?")
-                         .withDefault<bool>(false)),
-      prune_abstol((*options)["prune_abstol"]
-                       .doc("Prune values with absolute values smaller than this")
-                       .withDefault<BoutReal>(1e-16)),
-      prune_fraction((*options)["prune_fraction"]
-                         .doc("Prune if fraction of small elements is larger than this")
-                         .withDefault<BoutReal>(0.2)),
-      scale_rhs((*options)["scale_rhs"]
-                    .doc("Scale time derivatives (Jacobian row scaling)?")
-                    .withDefault<bool>(false)),
-      scale_vars((*options)["scale_vars"]
-                     .doc("Scale variables (Jacobian column scaling)?")
-                     .withDefault<bool>(false)) {}
+                       .withDefault<bool>(true)) {}
 
 int SNESSolver::init() {
 
@@ -184,38 +202,12 @@ int SNESSolver::init() {
 
   if (equation_form == BoutSnesEquationForm::rearranged_backward_euler) {
     // Need an intermediate vector for rearranged Backward Euler
-    ierr = VecDuplicate(snes_x, &delta_x);
-    CHKERRQ(ierr);
+    VecDuplicate(snes_x, &delta_x);
   }
 
   if (predictor) {
     // Storage for previous solution
-    ierr = VecDuplicate(snes_x, &x1);
-    CHKERRQ(ierr);
-  }
-
-  if (scale_rhs) {
-    // Storage for rhs factors, one per evolving variable
-    ierr = VecDuplicate(snes_x, &rhs_scaling_factors);
-    CHKERRQ(ierr);
-    // Set all factors to 1 to start with
-    ierr = VecSet(rhs_scaling_factors, 1.0);
-    CHKERRQ(ierr);
-    // Array to store inverse Jacobian row norms
-    ierr = VecDuplicate(snes_x, &jac_row_inv_norms);
-    CHKERRQ(ierr);
-  }
-
-  if (scale_vars) {
-    // Storage for var factors, one per evolving variable
-    ierr = VecDuplicate(snes_x, &var_scaling_factors);
-    CHKERRQ(ierr);
-    // Set all factors to 1 to start with
-    ierr = VecSet(var_scaling_factors, 1.0);
-    CHKERRQ(ierr);
-    // Storage for scaled 'x' state vectors
-    ierr = VecDuplicate(snes_x, &scaled_x);
-    CHKERRQ(ierr);
+    VecDuplicate(snes_x, &x1);
   }
 
   // Nonlinear solver interface (SNES)
@@ -235,7 +227,7 @@ int SNESSolver::init() {
   }
 
   // Set up the Jacobian
-  if (matrix_free or matrix_free_operator) {
+  if (matrix_free) {
     /*
       PETSc SNES matrix free Jacobian, using a different
       operator for differencing.
@@ -251,17 +243,12 @@ int SNESSolver::init() {
     // Set a function to be called for differencing
     // This can be a linearised form of the SNES function
     MatMFFDSetFunction(Jmf, FormFunctionForDifferencing, this);
-  }
 
-  if (matrix_free) {
-    // Use matrix free for both operator and preconditioner
     // Calculate Jacobian matrix free using FormFunctionForDifferencing
     SNESSetJacobian(snes, Jmf, Jmf, MatMFFDComputeJacobian, this);
 
   } else {
-    // Calculate the Jacobian using finite differences.
-    // The finite difference Jacobian (Jfd) may be used for both operator
-    // and preconditioner or, if matrix_free_operator, in only the preconditioner.
+    // Calculate the Jacobian using finite differences
     if (use_coloring) {
       // Use matrix coloring
       // This greatly reduces the number of times the rhs() function needs
@@ -279,263 +266,203 @@ int SNESSolver::init() {
 
       output_progress.write("Setting Jacobian matrix sizes\n");
 
+      int localN = getLocalN(); // Number of rows on this processor
       int n2d = f2d.size();
       int n3d = f3d.size();
 
-      // Set size of Matrix on each processor to nlocal x nlocal
-      MatCreate(BoutComm::get(), &Jfd);
-      MatSetSizes(Jfd, nlocal, nlocal, PETSC_DETERMINE, PETSC_DETERMINE);
-      MatSetFromOptions(Jfd);
-
-      std::vector<PetscInt> d_nnz(nlocal);
-      std::vector<PetscInt> o_nnz(nlocal);
-
-      // Set values for most points
-      const int ncells_x = (mesh->LocalNx > 1) ? 2 : 0;
-      const int ncells_y = (mesh->LocalNy > 1) ? 2 : 0;
-      const int ncells_z = (mesh->LocalNz > 1) ? 2 : 0;
-
-      const auto star_pattern = (1 + ncells_x + ncells_y) * (n3d + n2d) + ncells_z * n3d;
-
-      // Offsets. Start with the central cell
-      std::vector<std::pair<int, int>> xyoffsets{{0, 0}};
-      if (ncells_x != 0) {
-        // Stencil includes points in X
-        xyoffsets.push_back({-1, 0});
-        xyoffsets.push_back({1, 0});
-      }
-      if (ncells_y != 0) {
-        // Stencil includes points in Y
-        xyoffsets.push_back({0, -1});
-        xyoffsets.push_back({0, 1});
+      // Set size of Matrix on each processor to localN x localN
+      MatCreate(BoutComm::get(), &Jmf);
+      MatSetSizes(Jmf, localN, localN, PETSC_DETERMINE, PETSC_DETERMINE);
+      MatSetFromOptions(Jmf);
+      // Determine which row/columns of the matrix are locally owned
+      int Istart, Iend;
+      MatGetOwnershipRange(Jmf, &Istart, &Iend);
+      // Convert local into global indices
+      // Note: Not in the boundary cells, to keep -1 values
+      for (const auto& i : mesh->getRegion3D("RGN_NOBNDRY")) {
+        index[i] += Istart;
       }
+      // Now communicate to fill guard cells
+      mesh->communicate(index);
 
-      output_info.write("Star pattern: {} non-zero entries\n", star_pattern);
-      for (int i = 0; i < nlocal; i++) {
-        // Non-zero elements on this processor
-        d_nnz[i] = star_pattern;
-        // Non-zero elements on neighboring processor
-        o_nnz[i] = 0;
+      // Non-zero elements on this processor
+      std::vector<PetscInt> d_nnz;
+      std::vector<PetscInt> o_nnz;
+      auto n_square = (*options)["stencil:square"]
+                          .doc("Extent of stencil (square)")
+                          .withDefault<int>(0);
+      auto n_taxi = (*options)["stencil:taxi"]
+                        .doc("Extent of stencil (taxi-cab norm)")
+                        .withDefault<int>(0);
+      auto n_cross = (*options)["stencil:cross"]
+                         .doc("Extent of stencil (cross)")
+                         .withDefault<int>(0);
+      //Set n_taxi 2 if nothing else is set
+      //TODO: Probably a better way to do this
+      if (n_square == 0 && n_taxi == 0 && n_cross == 0) {
+        output_info.write("Setting beuler:stencil:taxi = 2\n");
+        n_taxi = 2;
       }
 
-      // X boundaries
-      if (ncells_x != 0) {
-        if (mesh->firstX()) {
-          // Lower X boundary
-          for (int y = mesh->ystart; y <= mesh->yend; y++) {
-            for (int z = 0; z < mesh->LocalNz; z++) {
-              const int localIndex = ROUND(index(mesh->xstart, y, z));
-              ASSERT2((localIndex >= 0) && (localIndex < nlocal));
-              const int num_fields = (z == 0) ? n2d + n3d : n3d;
-              for (int i = 0; i < num_fields; i++) {
-                d_nnz[localIndex + i] -= (n3d + n2d);
-              }
-            }
-          }
-        } else {
-          // On another processor
-          for (int y = mesh->ystart; y <= mesh->yend; y++) {
-            for (int z = 0; z < mesh->LocalNz; z++) {
-              const int localIndex = ROUND(index(mesh->xstart, y, z));
-              ASSERT2((localIndex >= 0) && (localIndex < nlocal));
-              const int num_fields = (z == 0) ? n2d + n3d : n3d;
-              for (int i = 0; i < num_fields; i++) {
-                d_nnz[localIndex + i] -= (n3d + n2d);
-                o_nnz[localIndex + i] += (n3d + n2d);
-              }
-            }
-          }
-        }
-        if (mesh->lastX()) {
-          // Upper X boundary
-          for (int y = mesh->ystart; y <= mesh->yend; y++) {
-            for (int z = 0; z < mesh->LocalNz; z++) {
-              const int localIndex = ROUND(index(mesh->xend, y, z));
-              ASSERT2((localIndex >= 0) && (localIndex < nlocal));
-              const int num_fields = (z == 0) ? n2d + n3d : n3d;
-              for (int i = 0; i < num_fields; i++) {
-                d_nnz[localIndex + i] -= (n3d + n2d);
-              }
-            }
-          }
-        } else {
-          // On another processor
+      auto const xyoffsets = ColoringStencil::get_offsets(n_square, n_taxi, n_cross);
+      {
+        //This is nasty but can't think of a better and robust way to
+        //count the non-zeros for some arbitery stencil
+        std::vector<std::set<int>> d_nnz_map2d(localN);
+        std::vector<std::set<int>> o_nnz_map2d(localN);
+        std::vector<std::set<int>> d_nnz_map3d(localN);
+        std::vector<std::set<int>> o_nnz_map3d(localN);
+        //Loop over every element in 2D to count the *unique* non-zeros
+        for (int x = mesh->xstart; x <= mesh->xend; x++) {
           for (int y = mesh->ystart; y <= mesh->yend; y++) {
-            for (int z = 0; z < mesh->LocalNz; z++) {
-              const int localIndex = ROUND(index(mesh->xend, y, z));
-              ASSERT2((localIndex >= 0) && (localIndex < nlocal));
-              const int num_fields = (z == 0) ? n2d + n3d : n3d;
-              for (int i = 0; i < num_fields; i++) {
-                d_nnz[localIndex + i] -= (n3d + n2d);
-                o_nnz[localIndex + i] += (n3d + n2d);
-              }
-            }
-          }
-        }
-      }
 
-      // Y boundaries
-      if (ncells_y != 0) {
-        for (int x = mesh->xstart; x <= mesh->xend; x++) {
-          // Default to no boundary
-          // NOTE: This assumes that communications in Y are to other
-          //   processors. If Y is communicated with this processor (e.g. NYPE=1)
-          //   then this will result in PETSc warnings about out of range allocations
-
-          // z = 0 case
-          int localIndex = ROUND(index(x, mesh->ystart, 0));
-          ASSERT2(localIndex >= 0);
-
-          // All 2D and 3D fields
-          for (int i = 0; i < n2d + n3d; i++) {
-            o_nnz[localIndex + i] += (n3d + n2d);
-            d_nnz[localIndex + i] -= (n3d + n2d);
-          }
+            int ind0 = ROUND(index(x, y, 0)) - Istart;
 
-          for (int z = 1; z < mesh->LocalNz; z++) {
-            localIndex = ROUND(index(x, mesh->ystart, z));
+            // 2D fields
+            for (int i = 0; i < n2d; i++) {
+              PetscInt row = ind0 + i;
+              //if (row < Istart || row >= Iend) continue;
+              // Loop through each point in the stencil
+              for (const auto& [x_off, y_off] : xyoffsets) {
+                int xi = x + x_off;
+                int yi = y + y_off;
+                if ((xi < 0) || (yi < 0) || (xi >= mesh->LocalNx)
+                    || (yi >= mesh->LocalNy)) {
+                  continue;
+                }
 
-            // Only 3D fields
-            for (int i = 0; i < n3d; i++) {
-              o_nnz[localIndex + i] += (n3d + n2d);
-              d_nnz[localIndex + i] -= (n3d + n2d);
+                int ind2 = ROUND(index(xi, yi, 0));
+                if (ind2 < 0) {
+                  continue; // A boundary point
+                }
+
+                // Depends on all variables on this cell
+                for (int j = 0; j < n2d; j++) {
+                  PetscInt col = ind2 + j;
+                  if (col >= Istart && col < Iend) {
+                    d_nnz_map2d[row].insert(col);
+                  } else {
+                    o_nnz_map2d[row].insert(col);
+                  }
+                }
+              }
             }
-          }
+            // 3D fields
+            for (int z = 0; z < mesh->LocalNz; z++) {
+              int ind = ROUND(index(x, y, z)) - Istart;
 
-          // z = 0 case
-          localIndex = ROUND(index(x, mesh->yend, 0));
-          // All 2D and 3D fields
-          for (int i = 0; i < n2d + n3d; i++) {
-            o_nnz[localIndex + i] += (n3d + n2d);
-            d_nnz[localIndex + i] -= (n3d + n2d);
-          }
+              for (int i = 0; i < n3d; i++) {
+                PetscInt row = ind + i;
+                //if (row < Istart || row >= Iend) continue;
+                if (z == 0) {
+                  row += n2d;
+                }
 
-          for (int z = 1; z < mesh->LocalNz; z++) {
-            localIndex = ROUND(index(x, mesh->yend, z));
+                // Depends on 2D fields
+                for (int j = 0; j < n2d; j++) {
+                  PetscInt col = ind0 + j;
+                  if (col >= Istart && col < Iend) {
+                    d_nnz_map2d[row].insert(col);
+                  } else {
+                    o_nnz_map2d[row].insert(col);
+                  }
+                }
 
-            // Only 3D fields
-            for (int i = 0; i < n3d; i++) {
-              o_nnz[localIndex + i] += (n3d + n2d);
-              d_nnz[localIndex + i] -= (n3d + n2d);
-            }
-          }
-        }
+                // Star pattern
+                for (const auto& [x_off, y_off] : xyoffsets) {
+                  int xi = x + x_off;
+                  int yi = y + y_off;
 
-        for (RangeIterator it = mesh->iterateBndryLowerY(); !it.isDone(); it++) {
-          // A boundary, so no communication
+                  if ((xi < 0) || (yi < 0) || (xi > mesh->LocalNx)
+                      || (yi > mesh->LocalNy)) {
+                    continue;
+                  }
 
-          // z = 0 case
-          int localIndex = ROUND(index(it.ind, mesh->ystart, 0));
-          if (localIndex < 0) {
-            // This can occur because it.ind includes values in x boundary e.g. x=0
-            continue;
-          }
-          // All 2D and 3D fields
-          for (int i = 0; i < n2d + n3d; i++) {
-            o_nnz[localIndex + i] -= (n3d + n2d);
-          }
+                  int ind2 = ROUND(index(xi, yi, 0));
+                  if (ind2 < 0) {
+                    continue; // Boundary point
+                  }
 
-          for (int z = 1; z < mesh->LocalNz; z++) {
-            int localIndex = ROUND(index(it.ind, mesh->ystart, z));
+                  if (z == 0) {
+                    ind2 += n2d;
+                  }
 
-            // Only 3D fields
-            for (int i = 0; i < n3d; i++) {
-              o_nnz[localIndex + i] -= (n3d + n2d);
+                  // 3D fields on this cell
+                  for (int j = 0; j < n3d; j++) {
+                    PetscInt col = ind2 + j;
+                    if (col >= Istart && col < Iend) {
+                      d_nnz_map3d[row].insert(col);
+                    } else {
+                      o_nnz_map3d[row].insert(col);
+                    }
+                  }
+                }
+              }
             }
           }
         }
 
-        for (RangeIterator it = mesh->iterateBndryUpperY(); !it.isDone(); it++) {
-          // A boundary, so no communication
-
-          // z = 0 case
-          const int localIndex = ROUND(index(it.ind, mesh->yend, 0));
-          if (localIndex < 0) {
-            continue; // Out of domain
-          }
-
-          // All 2D and 3D fields
-          for (int i = 0; i < n2d + n3d; i++) {
-            o_nnz[localIndex + i] -= (n3d + n2d);
-          }
-
-          for (int z = 1; z < mesh->LocalNz; z++) {
-            const int localIndex = ROUND(index(it.ind, mesh->yend, z));
+        d_nnz.reserve(localN);
+        d_nnz.reserve(localN);
 
-            // Only 3D fields
-            for (int i = 0; i < n3d; i++) {
-              o_nnz[localIndex + i] -= (n3d + n2d);
-            }
-          }
+        for (int i = 0; i < localN; ++i) {
+          //Assume all elements in the z direction are potentially coupled
+          d_nnz.emplace_back(d_nnz_map3d[i].size() * mesh->LocalNz
+                             + d_nnz_map2d[i].size());
+          o_nnz.emplace_back(o_nnz_map3d[i].size() * mesh->LocalNz
+                             + o_nnz_map2d[i].size());
         }
       }
 
       output_progress.write("Pre-allocating Jacobian\n");
-
       // Pre-allocate
-      MatMPIAIJSetPreallocation(Jfd, 0, d_nnz.data(), 0, o_nnz.data());
-      MatSeqAIJSetPreallocation(Jfd, 0, d_nnz.data());
-      MatSetUp(Jfd);
-      MatSetOption(Jfd, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE);
+      MatMPIAIJSetPreallocation(Jmf, 0, d_nnz.data(), 0, o_nnz.data());
+      MatSeqAIJSetPreallocation(Jmf, 0, d_nnz.data());
+      MatSetUp(Jmf);
+      MatSetOption(Jmf, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE);
 
-      // Determine which row/columns of the matrix are locally owned
-      int Istart, Iend;
-      MatGetOwnershipRange(Jfd, &Istart, &Iend);
-
-      // Convert local into global indices
-      // Note: Not in the boundary cells, to keep -1 values
-      for (const auto& i : mesh->getRegion3D("RGN_NOBNDRY")) {
-        index[i] += Istart;
-      }
-
-      // Now communicate to fill guard cells
-      mesh->communicate(index);
+      //  // Determine which row/columns of the matrix are locally owned
+      //  int Istart, Iend;
+      //  MatGetOwnershipRange(Jmf, &Istart, &Iend);
 
       //////////////////////////////////////////////////
       // Mark non-zero entries
 
       output_progress.write("Marking non-zero Jacobian entries\n");
-
-      const PetscScalar val = 1.0;
-
+      PetscScalar val = 1.0;
       for (int x = mesh->xstart; x <= mesh->xend; x++) {
         for (int y = mesh->ystart; y <= mesh->yend; y++) {
 
-          const int ind0 = ROUND(index(x, y, 0));
+          int ind0 = ROUND(index(x, y, 0));
 
           // 2D fields
           for (int i = 0; i < n2d; i++) {
-            const PetscInt row = ind0 + i;
-
-            // Loop through each point in the 5-point stencil
-            for (const auto& xyoffset : xyoffsets) {
-              const int xi = x + xyoffset.first;
-              const int yi = y + xyoffset.second;
+            PetscInt row = ind0 + i;
 
-              if ((xi < 0) || (yi < 0) || (xi >= mesh->LocalNx)
-                  || (yi >= mesh->LocalNy)) {
+            // Loop through each point in the stencil
+            for (const auto& [x_off, y_off] : xyoffsets) {
+              int xi = x + x_off;
+              int yi = y + y_off;
+              if ((xi < 0) || (yi < 0) || (xi > mesh->LocalNx) || (yi > mesh->LocalNy)) {
                 continue;
               }
 
-              const int ind2 = ROUND(index(xi, yi, 0));
-
+              int ind2 = ROUND(index(xi, yi, 0));
               if (ind2 < 0) {
                 continue; // A boundary point
               }
 
               // Depends on all variables on this cell
               for (int j = 0; j < n2d; j++) {
-                const PetscInt col = ind2 + j;
-                ierr = MatSetValues(Jfd, 1, &row, 1, &col, &val, INSERT_VALUES);
+                PetscInt col = ind2 + j;
+                ierr = MatSetValues(Jmf, 1, &row, 1, &col, &val, INSERT_VALUES);
                 CHKERRQ(ierr);
               }
             }
           }
-
           // 3D fields
           for (int z = 0; z < mesh->LocalNz; z++) {
-
-            const int ind = ROUND(index(x, y, z));
+            int ind = ROUND(index(x, y, z));
 
             for (int i = 0; i < n3d; i++) {
               PetscInt row = ind + i;
@@ -545,94 +472,93 @@ int SNESSolver::init() {
 
               // Depends on 2D fields
               for (int j = 0; j < n2d; j++) {
-                const PetscInt col = ind0 + j;
-                ierr = MatSetValues(Jfd, 1, &row, 1, &col, &val, INSERT_VALUES);
+                PetscInt col = ind0 + j;
+                ierr = MatSetValues(Jmf, 1, &row, 1, &col, &val, INSERT_VALUES);
                 CHKERRQ(ierr);
               }
 
               // Star pattern
-              for (const auto& xyoffset : xyoffsets) {
-                const int xi = x + xyoffset.first;
-                const int yi = y + xyoffset.second;
+              for (const auto& [x_off, y_off] : xyoffsets) {
+                int xi = x + x_off;
+                int yi = y + y_off;
 
                 if ((xi < 0) || (yi < 0) || (xi >= mesh->LocalNx)
                     || (yi >= mesh->LocalNy)) {
                   continue;
                 }
-
-                int ind2 = ROUND(index(xi, yi, z));
-                if (ind2 < 0) {
-                  continue; // Boundary point
-                }
-
-                if (z == 0) {
-                  ind2 += n2d;
-                }
-
-                // 3D fields on this cell
-                for (int j = 0; j < n3d; j++) {
-                  const PetscInt col = ind2 + j;
-                  ierr = MatSetValues(Jfd, 1, &row, 1, &col, &val, INSERT_VALUES);
-                  if (ierr != 0) {
-                    output.write("ERROR: {} : ({}, {}) -> ({}, {}) : {} -> {}\n", row, x,
-                                 y, xi, yi, ind2, ind2 + n3d - 1);
+                for (int zi = 0; zi < mesh->LocalNz; ++zi) {
+                  int ind2 = ROUND(index(xi, yi, zi));
+                  if (ind2 < 0) {
+                    continue; // Boundary point
                   }
-                  CHKERRQ(ierr);
-                }
-              }
-
-              int nz = mesh->LocalNz;
-              if (nz > 1) {
-                // Multiple points in z
 
-                int zp = (z + 1) % nz;
-
-                int ind2 = ROUND(index(x, y, zp));
-                if (zp == 0) {
-                  ind2 += n2d;
-                }
-                for (int j = 0; j < n3d; j++) {
-                  const PetscInt col = ind2 + j;
-                  ierr = MatSetValues(Jfd, 1, &row, 1, &col, &val, INSERT_VALUES);
-                  CHKERRQ(ierr);
-                }
+                  if (z == 0) {
+                    ind2 += n2d;
+                  }
 
-                int zm = (z - 1 + nz) % nz;
-                ind2 = ROUND(index(x, y, zm));
-                if (zm == 0) {
-                  ind2 += n2d;
-                }
-                for (int j = 0; j < n3d; j++) {
-                  const PetscInt col = ind2 + j;
-                  ierr = MatSetValues(Jfd, 1, &row, 1, &col, &val, INSERT_VALUES);
-                  CHKERRQ(ierr);
+                  // 3D fields on this cell
+                  for (int j = 0; j < n3d; j++) {
+                    PetscInt col = ind2 + j;
+                    //printf("%d %d\n",row,col);
+                    ierr = MatSetValues(Jmf, 1, &row, 1, &col, &val, INSERT_VALUES);
+
+                    if (ierr != 0) {
+                      output.write("ERROR: {} {} : ({}, {}) -> ({}, {}) : {} -> {}\n",
+                                   row, x, y, xi, yi, ind2, ind2 + n3d - 1);
+                    }
+                    CHKERRQ(ierr);
+                  }
                 }
               }
             }
           }
         }
       }
+
       // Finished marking non-zero entries
 
       output_progress.write("Assembling Jacobian matrix\n");
 
       // Assemble Matrix
-      MatAssemblyBegin(Jfd, MAT_FINAL_ASSEMBLY);
-      MatAssemblyEnd(Jfd, MAT_FINAL_ASSEMBLY);
+      MatAssemblyBegin(Jmf, MAT_FINAL_ASSEMBLY);
+      MatAssemblyEnd(Jmf, MAT_FINAL_ASSEMBLY);
+
+      //The above will probably miss some non-zero entries at process boundaries
+      //Making sure the colouring matrix is symmetric will in some/all(?)
+      //of the missing non-zeros
+      if ((*options)["force_symmetric_coloring"]
+              .doc("Modifies coloring matrix to force it to be symmetric")
+              .withDefault<bool>(false)) {
+        Mat Jmf_T;
+        MatCreateTranspose(Jmf, &Jmf_T);
+        MatAXPY(Jmf, 1, Jmf_T, DIFFERENT_NONZERO_PATTERN);
+      }
 
       output_progress.write("Creating Jacobian coloring\n");
-      updateColoring();
 
-      if (prune_jacobian) {
-        // Will remove small elements from the Jacobian.
-        // Save a copy to recover from over-pruning
-        ierr = MatDuplicate(Jfd, MAT_SHARE_NONZERO_PATTERN, &Jfd_original);
-        CHKERRQ(ierr);
-      }
+      ISColoring iscoloring;
+
+      MatColoring coloring; // This new in PETSc 3.5
+      MatColoringCreate(Jmf, &coloring);
+      MatColoringSetType(coloring, MATCOLORINGSL);
+      MatColoringSetFromOptions(coloring);
+      // Calculate index sets
+      MatColoringApply(coloring, &iscoloring);
+      MatColoringDestroy(&coloring);
+
+      // Create data structure for SNESComputeJacobianDefaultColor
+      MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
+      // Set the function to difference
+      MatFDColoringSetFunction(
+          fdcoloring, reinterpret_cast<PetscErrorCode (*)()>(FormFunctionForColoring),
+          this);
+      MatFDColoringSetFromOptions(fdcoloring);
+      MatFDColoringSetUp(Jmf, iscoloring, fdcoloring);
+      ISColoringDestroy(&iscoloring);
+
+      SNESSetJacobian(snes, Jmf, Jmf, SNESComputeJacobianDefaultColor, fdcoloring);
     } else {
       // Brute force calculation
-      // There is usually no reason to use this, except as a check of
-      // the coloring calculation.
 
       MatCreateAIJ(
           BoutComm::get(), nlocal, nlocal,  // Local sizes
@@ -640,20 +566,17 @@ int SNESSolver::init() {
           3, // Number of nonzero entries in diagonal portion of local submatrix
           nullptr,
           0, // Number of nonzeros per row in off-diagonal portion of local submatrix
-          nullptr, &Jfd);
-
-      if (matrix_free_operator) {
-        SNESSetJacobian(snes, Jmf, Jfd, SNESComputeJacobianDefault, this);
-      } else {
-        SNESSetJacobian(snes, Jfd, Jfd, SNESComputeJacobianDefault, this);
-      }
-
-      MatSetOption(Jfd, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_FALSE);
+          nullptr, &Jmf);
+#if PETSC_VERSION_GE(3, 4, 0)
+      SNESSetJacobian(snes, Jmf, Jmf, SNESComputeJacobianDefault, this);
+#else
+      // Before 3.4
+      SNESSetJacobian(snes, Jmf, Jmf, SNESDefaultComputeJacobian, this);
+#endif
+      MatSetOption(Jmf, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_FALSE);
     }
 
     // Re-use Jacobian
-    // Note: If the 'Amat' Jacobian is matrix free, SNESComputeJacobian
-    //       always updates its reference 'u' vector every nonlinear iteration
     SNESSetLagJacobian(snes, lag_jacobian);
     // Set Jacobian and preconditioner to persist across time steps
     SNESSetLagJacobianPersists(snes, PETSC_TRUE);
@@ -664,8 +587,8 @@ int SNESSolver::init() {
   // Set tolerances
   SNESSetTolerances(snes, atol, rtol, stol, maxits, PETSC_DEFAULT);
 
-  // Force SNES to take at least one nonlinear iteration.
-  // This may prevent the solver from getting stuck in false steady state conditions
+// Force SNES to take at least one nonlinear iteration.
+// This may prevent the solver from getting stuck in false steady state conditions
 #if PETSC_VERSION_GE(3, 8, 0)
   SNESSetForceIteration(snes, PETSC_TRUE);
 #endif
@@ -747,7 +670,6 @@ int SNESSolver::init() {
 
 int SNESSolver::run() {
   TRACE("SNESSolver::run()");
-  int ierr;
   // Set initial guess at the solution from variables
   {
     BoutReal* xdata = nullptr;
@@ -764,63 +686,7 @@ int SNESSolver::run() {
     bool looping = true;
     int snes_failures = 0; // Count SNES convergence failures
     int saved_jacobian_lag = 0;
-    int loop_count = 0;
     do {
-      if (scale_vars) {
-        // Individual variable scaling
-        // Note: If variables are rescaled then the Jacobian columns
-        //       need to be scaled or recalculated
-
-        if (loop_count % 100 == 0) {
-          // Rescale state (snes_x) so that all quantities are around 1
-          // If quantities are near zero then RTOL is used
-          int istart, iend;
-          VecGetOwnershipRange(snes_x, &istart, &iend);
-
-          // Take ownership of snes_x and var_scaling_factors data
-          PetscScalar* snes_x_data = nullptr;
-          ierr = VecGetArray(snes_x, &snes_x_data);
-          CHKERRQ(ierr);
-          PetscScalar* x1_data;
-          ierr = VecGetArray(x1, &x1_data);
-          CHKERRQ(ierr);
-          PetscScalar* var_scaling_factors_data;
-          ierr = VecGetArray(var_scaling_factors, &var_scaling_factors_data);
-          CHKERRQ(ierr);
-
-          // Normalise each value in the state
-          // Limit normalisation so scaling factor is never smaller than rtol
-          for (int i = 0; i < iend - istart; ++i) {
-            const PetscScalar norm =
-                BOUTMAX(std::abs(snes_x_data[i]), rtol / var_scaling_factors_data[i]);
-            snes_x_data[i] /= norm;
-            x1_data[i] /= norm; // Update history for predictor
-            var_scaling_factors_data[i] *= norm;
-          }
-
-          // Restore vector underlying data
-          ierr = VecRestoreArray(var_scaling_factors, &var_scaling_factors_data);
-          CHKERRQ(ierr);
-          ierr = VecRestoreArray(x1, &x1_data);
-          CHKERRQ(ierr);
-          ierr = VecRestoreArray(snes_x, &snes_x_data);
-          CHKERRQ(ierr);
-
-          if (diagnose) {
-            // Print maximum and minimum scaling factors
-            PetscReal max_scale, min_scale;
-            VecMax(var_scaling_factors, nullptr, &max_scale);
-            VecMin(var_scaling_factors, nullptr, &min_scale);
-            output.write("Var scaling: {} -> {}\n", min_scale, max_scale);
-          }
-
-          // Force recalculation of the Jacobian
-          SNESGetLagJacobian(snes, &saved_jacobian_lag);
-          SNESSetLagJacobian(snes, 1);
-        }
-      }
-      ++loop_count;
-
       // Copy the state (snes_x) into initial values (x0)
       VecCopy(snes_x, x0);
 
@@ -862,13 +728,6 @@ int SNESSolver::run() {
       // Find out if converged
       SNESConvergedReason reason;
       SNESGetConvergedReason(snes, &reason);
-
-      // Get number of iterations
-      int nl_its;
-      SNESGetIterationNumber(snes, &nl_its);
-      int lin_its;
-      SNESGetLinearSolveIterations(snes, &lin_its);
-
       if ((ierr != 0) or (reason < 0)) {
         // Diverged or SNES failed
 
@@ -899,19 +758,6 @@ int SNESSolver::run() {
         VecCopy(x0, snes_x);
 
         // Recalculate the Jacobian
-        if (jacobian_pruned and (snes_failures > 2) and (4 * lin_its > 3 * maxl)) {
-          // Taking 3/4 of maximum linear iterations on average per linear step
-          // May indicate a preconditioner problem.
-          // Restore pruned non-zero elements
-          if (diagnose) {
-            output.write("\nRestoring Jacobian\n");
-          }
-          ierr = MatCopy(Jfd_original, Jfd, DIFFERENT_NONZERO_PATTERN);
-          CHKERRQ(ierr);
-          // The non-zero pattern has changed, so update coloring
-          updateColoring();
-          jacobian_pruned = false; // Reset flag. Will be set after pruning.
-        }
         if (saved_jacobian_lag == 0) {
           SNESGetLagJacobian(snes, &saved_jacobian_lag);
           SNESSetLagJacobian(snes, 1);
@@ -944,24 +790,16 @@ int SNESSolver::run() {
         time1 = simtime;
       }
 
+      int nl_its;
+      SNESGetIterationNumber(snes, &nl_its);
+
       if (nl_its == 0) {
         // This can occur even with SNESSetForceIteration
         // Results in simulation state freezing and rapidly going to the end
 
-        if (scale_vars) {
-          // scaled_x <- snes_x * var_scaling_factors
-          ierr = VecPointwiseMult(scaled_x, snes_x, var_scaling_factors);
-          CHKERRQ(ierr);
-
-          const BoutReal* xdata = nullptr;
-          ierr = VecGetArrayRead(scaled_x, &xdata);
-          CHKERRQ(ierr);
-          load_vars(const_cast<BoutReal*>(xdata));
-          ierr = VecRestoreArrayRead(scaled_x, &xdata);
-          CHKERRQ(ierr);
-        } else {
+        {
           const BoutReal* xdata = nullptr;
-          ierr = VecGetArrayRead(snes_x, &xdata);
+          int ierr = VecGetArrayRead(snes_x, &xdata);
           CHKERRQ(ierr);
           load_vars(const_cast<BoutReal*>(xdata));
           ierr = VecRestoreArrayRead(snes_x, &xdata);
@@ -988,6 +826,9 @@ int SNESSolver::run() {
       if (diagnose) {
         // Gather and print diagnostic information
 
+        int lin_its;
+        SNESGetLinearSolveIterations(snes, &lin_its);
+
         output.print("\r"); // Carriage return for printing to screen
         output.write("Time: {}, timestep: {}, nl iter: {}, lin iter: {}, reason: {}",
                      simtime, timestep, nl_its, lin_its, static_cast<int>(reason));
@@ -998,51 +839,6 @@ int SNESSolver::run() {
         output.write("\n");
       }
 
-#if PETSC_VERSION_GE(3, 20, 0)
-      // MatFilter and MatEliminateZeros(Mat, bool) require PETSc >= 3.20
-      if (jacobian_recalculated and prune_jacobian) {
-        jacobian_recalculated = false; // Reset flag
-
-        // Remove small elements from the Jacobian and recompute the coloring
-        // Only do this if there are a significant number of small elements.
-        int small_elements = 0;
-        int total_elements = 0;
-
-        // Get index of rows owned by this processor
-        int rstart, rend;
-        MatGetOwnershipRange(Jfd, &rstart, &rend);
-
-        PetscInt ncols;
-        const PetscScalar* vals;
-        for (int row = rstart; row < rend; row++) {
-          MatGetRow(Jfd, row, &ncols, nullptr, &vals);
-          for (int col = 0; col < ncols; col++) {
-            if (std::abs(vals[col]) < prune_abstol) {
-              ++small_elements;
-            }
-            ++total_elements;
-          }
-          MatRestoreRow(Jfd, row, &ncols, nullptr, &vals);
-        }
-
-        if (small_elements > prune_fraction * total_elements) {
-          if (diagnose) {
-            output.write("\nPruning Jacobian elements: {} / {}\n", small_elements,
-                         total_elements);
-          }
-
-          // Prune Jacobian, keeping diagonal elements
-          ierr = MatFilter(Jfd, prune_abstol, PETSC_TRUE, PETSC_TRUE);
-
-          // Update the coloring from Jfd matrix
-          updateColoring();
-
-          // Mark the Jacobian as pruned. This is so that it is only restored if pruned.
-          jacobian_pruned = true;
-        }
-      }
-#endif // PETSC_VERSION_GE(3,20,0)
-
       if (looping) {
         if (nl_its <= lower_its) {
           // Increase timestep slightly
@@ -1059,18 +855,7 @@ int SNESSolver::run() {
     } while (looping);
 
     // Put the result into variables
-    if (scale_vars) {
-      // scaled_x <- snes_x * var_scaling_factors
-      int ierr = VecPointwiseMult(scaled_x, snes_x, var_scaling_factors);
-      CHKERRQ(ierr);
-
-      const BoutReal* xdata = nullptr;
-      ierr = VecGetArrayRead(scaled_x, &xdata);
-      CHKERRQ(ierr);
-      load_vars(const_cast<BoutReal*>(xdata));
-      ierr = VecRestoreArrayRead(scaled_x, &xdata);
-      CHKERRQ(ierr);
-    } else {
+    {
       const BoutReal* xdata = nullptr;
       int ierr = VecGetArrayRead(snes_x, &xdata);
       CHKERRQ(ierr);
@@ -1091,27 +876,12 @@ int SNESSolver::run() {
 // f = rhs
 PetscErrorCode SNESSolver::snes_function(Vec x, Vec f, bool linear) {
   // Get data from PETSc into BOUT++ fields
-  if (scale_vars) {
-    // scaled_x <- x * var_scaling_factors
-    int ierr = VecPointwiseMult(scaled_x, x, var_scaling_factors);
-    CHKERRQ(ierr);
-
-    const BoutReal* xdata = nullptr;
-    ierr = VecGetArrayRead(scaled_x, &xdata);
-    CHKERRQ(ierr);
-    load_vars(const_cast<BoutReal*>(
-        xdata)); // const_cast needed due to load_vars API. Not writing to xdata.
-    ierr = VecRestoreArrayRead(scaled_x, &xdata);
-    CHKERRQ(ierr);
-  } else {
-    const BoutReal* xdata = nullptr;
-    int ierr = VecGetArrayRead(x, &xdata);
-    CHKERRQ(ierr);
-    load_vars(const_cast<BoutReal*>(
-        xdata)); // const_cast needed due to load_vars API. Not writing to xdata.
-    ierr = VecRestoreArrayRead(x, &xdata);
-    CHKERRQ(ierr);
-  }
+  const BoutReal* xdata = nullptr;
+  int ierr = VecGetArrayRead(x, &xdata);
+  CHKERRQ(ierr);
+  load_vars(const_cast<BoutReal*>(xdata));
+  ierr = VecRestoreArrayRead(x, &xdata);
+  CHKERRQ(ierr);
 
   try {
     // Call RHS function
@@ -1129,7 +899,7 @@ PetscErrorCode SNESSolver::snes_function(Vec x, Vec f, bool linear) {
 
   // Copy derivatives back
   BoutReal* fdata = nullptr;
-  int ierr = VecGetArray(f, &fdata);
+  ierr = VecGetArray(f, &fdata);
   CHKERRQ(ierr);
   save_derivs(fdata);
   ierr = VecRestoreArray(f, &fdata);
@@ -1166,12 +936,6 @@ PetscErrorCode SNESSolver::snes_function(Vec x, Vec f, bool linear) {
   }
   };
 
-  if (scale_rhs) {
-    // f <- f * rhs_scaling_factors
-    ierr = VecPointwiseMult(f, f, rhs_scaling_factors);
-    CHKERRQ(ierr);
-  }
-
   return 0;
 }
 
@@ -1218,133 +982,4 @@ PetscErrorCode SNESSolver::precon(Vec x, Vec f) {
   return 0;
 }
 
-PetscErrorCode SNESSolver::scaleJacobian(Mat Jac_new) {
-  jacobian_recalculated = true;
-
-  if (!scale_rhs) {
-    return 0; // Not scaling the RHS values
-  }
-
-  int ierr;
-
-  // Get index of rows owned by this processor
-  int rstart, rend;
-  MatGetOwnershipRange(Jac_new, &rstart, &rend);
-
-  // Check that the vector has the same ownership range
-  int istart, iend;
-  VecGetOwnershipRange(jac_row_inv_norms, &istart, &iend);
-  if ((rstart != istart) or (rend != iend)) {
-    throw BoutException("Ownership ranges different: [{}, {}) and [{}, {})\n", rstart,
-                        rend, istart, iend);
-  }
-
-  // Calculate the norm of each row of the Jacobian
-  PetscScalar* row_inv_norm_data;
-  ierr = VecGetArray(jac_row_inv_norms, &row_inv_norm_data);
-  CHKERRQ(ierr);
-
-  PetscInt ncols;
-  const PetscScalar* vals;
-  for (int row = rstart; row < rend; ++row) {
-    MatGetRow(Jac_new, row, &ncols, nullptr, &vals);
-
-    // Calculate a norm of this row of the Jacobian
-    PetscScalar norm = 0.0;
-    for (int col = 0; col < ncols; col++) {
-      PetscScalar absval = std::abs(vals[col]);
-      if (absval > norm) {
-        norm = absval;
-      }
-      // Can we identify small elements and remove them?
-      // so we don't need to calculate them next time
-    }
-
-    // Store in the vector as 1 / norm
-    row_inv_norm_data[row - rstart] = 1. / norm;
-
-    MatRestoreRow(Jac_new, row, &ncols, nullptr, &vals);
-  }
-
-  ierr = VecRestoreArray(jac_row_inv_norms, &row_inv_norm_data);
-  CHKERRQ(ierr);
-
-  // Modify the RHS scaling: factor = factor / norm
-  ierr = VecPointwiseMult(rhs_scaling_factors, rhs_scaling_factors, jac_row_inv_norms);
-  CHKERRQ(ierr);
-
-  if (diagnose) {
-    // Print maximum and minimum scaling factors
-    PetscReal max_scale, min_scale;
-    VecMax(rhs_scaling_factors, nullptr, &max_scale);
-    VecMin(rhs_scaling_factors, nullptr, &min_scale);
-    output.write("RHS scaling: {} -> {}\n", min_scale, max_scale);
-  }
-
-  // Scale the Jacobian rows by multiplying on the left by 1/norm
-  ierr = MatDiagonalScale(Jac_new, jac_row_inv_norms, nullptr);
-  CHKERRQ(ierr);
-
-  return 0;
-}
-
-///
-/// Input Parameters:
-///   snes - nonlinear solver object
-///   x1 - location at which to evaluate Jacobian
-///   ctx - MatFDColoring context or NULL
-///
-/// Output Parameters:
-///   Jac - Jacobian matrix (not altered in this routine)
-///   Jac_new - newly computed Jacobian matrix to use with preconditioner (generally the same as
-///   Jac)
-static PetscErrorCode ComputeJacobianScaledColor(SNES snes, Vec x1, Mat Jac, Mat Jac_new,
-                                                 void* ctx) {
-  PetscErrorCode err = SNESComputeJacobianDefaultColor(snes, x1, Jac, Jac_new, ctx);
-  CHKERRQ(err);
-
-  if ((err != 0) or (ctx == nullptr)) {
-    return err;
-  }
-
-  // Get the the SNESSolver pointer from the function call context
-  SNESSolver* fctx = nullptr;
-  err = MatFDColoringGetFunction(static_cast<MatFDColoring>(ctx), nullptr,
-                                 reinterpret_cast<void**>(&fctx));
-  CHKERRQ(err);
-
-  // Call the SNESSolver function
-  return fctx->scaleJacobian(Jac_new);
-}
-
-void SNESSolver::updateColoring() {
-  // Re-calculate the coloring
-  MatColoring coloring = NULL;
-  MatColoringCreate(Jfd, &coloring);
-  MatColoringSetType(coloring, MATCOLORINGSL);
-  MatColoringSetFromOptions(coloring);
-
-  // Calculate new index sets
-  ISColoring iscoloring = NULL;
-  MatColoringApply(coloring, &iscoloring);
-  MatColoringDestroy(&coloring);
-
-  // Replace the old coloring with the new one
-  MatFDColoringDestroy(&fdcoloring);
-  MatFDColoringCreate(Jfd, iscoloring, &fdcoloring);
-  MatFDColoringSetFunction(
-      fdcoloring, reinterpret_cast<PetscErrorCode (*)()>(FormFunctionForColoring), this);
-  MatFDColoringSetFromOptions(fdcoloring);
-  MatFDColoringSetUp(Jfd, iscoloring, fdcoloring);
-  ISColoringDestroy(&iscoloring);
-
-  // Replace the CTX pointer in SNES Jacobian
-  if (matrix_free_operator) {
-    // Use matrix-free calculation for operator, finite difference for preconditioner
-    SNESSetJacobian(snes, Jmf, Jfd, ComputeJacobianScaledColor, fdcoloring);
-  } else {
-    SNESSetJacobian(snes, Jfd, Jfd, ComputeJacobianScaledColor, fdcoloring);
-  }
-}
-
 #endif // BOUT_HAS_PETSC

From 19ec182e965ecbea66d731a8c2218c148d84a8a8 Mon Sep 17 00:00:00 2001
From: Seimon Powell <seimon.powell@ukaea.uk>
Date: Thu, 24 Apr 2025 15:51:58 +0100
Subject: [PATCH 035/129] Change message to match rest of output

---
 src/solver/impls/snes/snes.cxx | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index aec986511f..176bcd9342 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -298,9 +298,9 @@ int SNESSolver::init() {
                          .doc("Extent of stencil (cross)")
                          .withDefault<int>(0);
       //Set n_taxi 2 if nothing else is set
-      //TODO: Probably a better way to do this
+      //Probably a better way to do this
       if (n_square == 0 && n_taxi == 0 && n_cross == 0) {
-        output_info.write("Setting beuler:stencil:taxi = 2\n");
+        output_info.write("Setting solver:stencil:taxi = 2\n");
         n_taxi = 2;
       }
 

From 697f729c723c4f7eec5fdb8336b0c5d9df6cae28 Mon Sep 17 00:00:00 2001
From: Seimon Powell <seimon.powell@ukaea.uk>
Date: Thu, 24 Apr 2025 16:01:01 +0100
Subject: [PATCH 036/129] Obey the naming conventions

---
 src/solver/impls/snes/snes.cxx | 39 +++++++++++++++++-----------------
 1 file changed, 20 insertions(+), 19 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 176bcd9342..67b6d75d54 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -18,10 +18,10 @@
 
 class ColoringStencil {
 private:
-  bool static in_compact(int const i, int const j, int const n_compact) {
-    return std::abs(i) <= n_compact && std::abs(j) <= n_compact;
+  bool static isInSquare(int const i, int const j, int const n_square) {
+    return std::abs(i) <= n_square && std::abs(j) <= n_square;
   }
-  bool static in_cross(int const i, int const j, int const n_cross) {
+  bool static isInCross(int const i, int const j, int const n_cross) {
     if (i == 0) {
       return std::abs(j) <= n_cross;
     }
@@ -30,28 +30,28 @@ class ColoringStencil {
     }
     return false;
   }
-  bool static in_taxi(int const i, int const j, int const n_taxi) {
+  bool static isInTaxi(int const i, int const j, int const n_taxi) {
     return std::abs(i) + std::abs(j) <= n_taxi;
   }
 
 public:
-  auto static get_offsets(int n_compact, int n_taxi, int n_cross) {
-    ASSERT2(n_compact >= 0 && n_cross >= 0 && n_taxi >= 0
-            && n_compact + n_cross + n_taxi > 0);
+  auto static getOffsets(int n_square, int n_taxi, int n_cross) {
+    ASSERT2(n_square >= 0 && n_cross >= 0 && n_taxi >= 0
+            && n_square + n_cross + n_taxi > 0);
     auto inside = [&](int i, int j) {
-      return in_compact(i, j, n_compact) || in_taxi(i, j, n_taxi)
-             || in_cross(i, j, n_cross);
+      return isInSquare(i, j, n_square) || isInTaxi(i, j, n_taxi)
+             || isInCross(i, j, n_cross);
     };
-    std::vector<std::pair<int, int>> xyoffset;
-    auto loop_bound = std::max({n_compact, n_taxi, n_cross});
+    std::vector<std::pair<int, int>> xy_offsets;
+    auto loop_bound = std::max({n_square, n_taxi, n_cross});
     for (int i = -loop_bound; i <= loop_bound; ++i) {
       for (int j = -loop_bound; j <= loop_bound; ++j) {
         if (inside(i, j)) {
-          xyoffset.emplace_back(i, j);
+          xy_offsets.emplace_back(i, j);
         }
       }
     }
-    return xyoffset;
+    return xy_offsets;
   }
 };
 
@@ -304,10 +304,11 @@ int SNESSolver::init() {
         n_taxi = 2;
       }
 
-      auto const xyoffsets = ColoringStencil::get_offsets(n_square, n_taxi, n_cross);
+      auto const xy_offsets = ColoringStencil::getOffsets(n_square, n_taxi, n_cross);
       {
-        //This is nasty but can't think of a better and robust way to
+        //This is ugly but can't think of a better and robust way to
         //count the non-zeros for some arbitery stencil
+        //effectivly the same loop as the one that sets the non-zeros below
         std::vector<std::set<int>> d_nnz_map2d(localN);
         std::vector<std::set<int>> o_nnz_map2d(localN);
         std::vector<std::set<int>> d_nnz_map3d(localN);
@@ -323,7 +324,7 @@ int SNESSolver::init() {
               PetscInt row = ind0 + i;
               //if (row < Istart || row >= Iend) continue;
               // Loop through each point in the stencil
-              for (const auto& [x_off, y_off] : xyoffsets) {
+              for (const auto& [x_off, y_off] : xy_offsets) {
                 int xi = x + x_off;
                 int yi = y + y_off;
                 if ((xi < 0) || (yi < 0) || (xi >= mesh->LocalNx)
@@ -369,7 +370,7 @@ int SNESSolver::init() {
                 }
 
                 // Star pattern
-                for (const auto& [x_off, y_off] : xyoffsets) {
+                for (const auto& [x_off, y_off] : xy_offsets) {
                   int xi = x + x_off;
                   int yi = y + y_off;
 
@@ -440,7 +441,7 @@ int SNESSolver::init() {
             PetscInt row = ind0 + i;
 
             // Loop through each point in the stencil
-            for (const auto& [x_off, y_off] : xyoffsets) {
+            for (const auto& [x_off, y_off] : xy_offsets) {
               int xi = x + x_off;
               int yi = y + y_off;
               if ((xi < 0) || (yi < 0) || (xi > mesh->LocalNx) || (yi > mesh->LocalNy)) {
@@ -478,7 +479,7 @@ int SNESSolver::init() {
               }
 
               // Star pattern
-              for (const auto& [x_off, y_off] : xyoffsets) {
+              for (const auto& [x_off, y_off] : xy_offsets) {
                 int xi = x + x_off;
                 int yi = y + y_off;
 

From 540ab7d39c0693fb9d5eebe9198a1d7b91ebdcac Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Thu, 24 Apr 2025 13:45:27 -0700
Subject: [PATCH 037/129] beuler: Merge improvements

PR #3009 included changes to allow matrix-free Jacobian-vector
products, while using the finite difference Jacobian for the
preconditioner. That gave significant speedups that will hopefully
also help now that the coloring stencil is fixed.
---
 src/solver/impls/snes/snes.cxx | 487 +++++++++++++++++++++++++++------
 1 file changed, 405 insertions(+), 82 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 67b6d75d54..61d98adafc 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -157,12 +157,31 @@ SNESSolver::SNESSolver(Options* opts)
       matrix_free((*options)["matrix_free"]
                       .doc("Use matrix free Jacobian?")
                       .withDefault<bool>(false)),
+      matrix_free_operator((*options)["matrix_free_operator"]
+                               .doc("Use matrix free Jacobian-vector operator?")
+                               .withDefault<bool>(true)),
       lag_jacobian((*options)["lag_jacobian"]
                        .doc("Re-use the Jacobian this number of SNES iterations")
                        .withDefault(50)),
       use_coloring((*options)["use_coloring"]
                        .doc("Use matrix coloring to calculate Jacobian?")
-                       .withDefault<bool>(true)) {}
+                       .withDefault<bool>(true)),
+      jacobian_recalculated(false),
+      prune_jacobian((*options)["prune_jacobian"]
+                         .doc("Remove small elements in the Jacobian?")
+                         .withDefault<bool>(false)),
+      prune_abstol((*options)["prune_abstol"]
+                       .doc("Prune values with absolute values smaller than this")
+                       .withDefault<BoutReal>(1e-16)),
+      prune_fraction((*options)["prune_fraction"]
+                         .doc("Prune if fraction of small elements is larger than this")
+                         .withDefault<BoutReal>(0.2)),
+      scale_rhs((*options)["scale_rhs"]
+                    .doc("Scale time derivatives (Jacobian row scaling)?")
+                    .withDefault<bool>(false)),
+      scale_vars((*options)["scale_vars"]
+                     .doc("Scale variables (Jacobian column scaling)?")
+                     .withDefault<bool>(false)) {}
 
 int SNESSolver::init() {
 
@@ -202,12 +221,38 @@ int SNESSolver::init() {
 
   if (equation_form == BoutSnesEquationForm::rearranged_backward_euler) {
     // Need an intermediate vector for rearranged Backward Euler
-    VecDuplicate(snes_x, &delta_x);
+    ierr = VecDuplicate(snes_x, &delta_x);
+    CHKERRQ(ierr);
   }
 
   if (predictor) {
     // Storage for previous solution
-    VecDuplicate(snes_x, &x1);
+    ierr = VecDuplicate(snes_x, &x1);
+    CHKERRQ(ierr);
+  }
+
+  if (scale_rhs) {
+    // Storage for rhs factors, one per evolving variable
+    ierr = VecDuplicate(snes_x, &rhs_scaling_factors);
+    CHKERRQ(ierr);
+    // Set all factors to 1 to start with
+    ierr = VecSet(rhs_scaling_factors, 1.0);
+    CHKERRQ(ierr);
+    // Array to store inverse Jacobian row norms
+    ierr = VecDuplicate(snes_x, &jac_row_inv_norms);
+    CHKERRQ(ierr);
+  }
+
+  if (scale_vars) {
+    // Storage for var factors, one per evolving variable
+    ierr = VecDuplicate(snes_x, &var_scaling_factors);
+    CHKERRQ(ierr);
+    // Set all factors to 1 to start with
+    ierr = VecSet(var_scaling_factors, 1.0);
+    CHKERRQ(ierr);
+    // Storage for scaled 'x' state vectors
+    ierr = VecDuplicate(snes_x, &scaled_x);
+    CHKERRQ(ierr);
   }
 
   // Nonlinear solver interface (SNES)
@@ -227,7 +272,7 @@ int SNESSolver::init() {
   }
 
   // Set up the Jacobian
-  if (matrix_free) {
+  if (matrix_free or matrix_free_operator) {
     /*
       PETSc SNES matrix free Jacobian, using a different
       operator for differencing.
@@ -243,12 +288,17 @@ int SNESSolver::init() {
     // Set a function to be called for differencing
     // This can be a linearised form of the SNES function
     MatMFFDSetFunction(Jmf, FormFunctionForDifferencing, this);
+  }
 
+  if (matrix_free) {
+    // Use matrix free for both operator and preconditioner
     // Calculate Jacobian matrix free using FormFunctionForDifferencing
     SNESSetJacobian(snes, Jmf, Jmf, MatMFFDComputeJacobian, this);
 
   } else {
-    // Calculate the Jacobian using finite differences
+    // Calculate the Jacobian using finite differences.
+    // The finite difference Jacobian (Jfd) may be used for both operator
+    // and preconditioner or, if matrix_free_operator, in only the preconditioner.
     if (use_coloring) {
       // Use matrix coloring
       // This greatly reduces the number of times the rhs() function needs
@@ -266,17 +316,16 @@ int SNESSolver::init() {
 
       output_progress.write("Setting Jacobian matrix sizes\n");
 
-      int localN = getLocalN(); // Number of rows on this processor
       int n2d = f2d.size();
       int n3d = f3d.size();
 
-      // Set size of Matrix on each processor to localN x localN
-      MatCreate(BoutComm::get(), &Jmf);
-      MatSetSizes(Jmf, localN, localN, PETSC_DETERMINE, PETSC_DETERMINE);
-      MatSetFromOptions(Jmf);
+      // Set size of Matrix on each processor to nlocal x nlocal
+      MatCreate(BoutComm::get(), &Jfd);
+      MatSetSizes(Jfd, nlocal, nlocal, PETSC_DETERMINE, PETSC_DETERMINE);
+      MatSetFromOptions(Jfd);
       // Determine which row/columns of the matrix are locally owned
       int Istart, Iend;
-      MatGetOwnershipRange(Jmf, &Istart, &Iend);
+      MatGetOwnershipRange(Jfd, &Istart, &Iend);
       // Convert local into global indices
       // Note: Not in the boundary cells, to keep -1 values
       for (const auto& i : mesh->getRegion3D("RGN_NOBNDRY")) {
@@ -309,10 +358,10 @@ int SNESSolver::init() {
         //This is ugly but can't think of a better and robust way to
         //count the non-zeros for some arbitery stencil
         //effectivly the same loop as the one that sets the non-zeros below
-        std::vector<std::set<int>> d_nnz_map2d(localN);
-        std::vector<std::set<int>> o_nnz_map2d(localN);
-        std::vector<std::set<int>> d_nnz_map3d(localN);
-        std::vector<std::set<int>> o_nnz_map3d(localN);
+        std::vector<std::set<int>> d_nnz_map2d(nlocal);
+        std::vector<std::set<int>> o_nnz_map2d(nlocal);
+        std::vector<std::set<int>> d_nnz_map3d(nlocal);
+        std::vector<std::set<int>> o_nnz_map3d(nlocal);
         //Loop over every element in 2D to count the *unique* non-zeros
         for (int x = mesh->xstart; x <= mesh->xend; x++) {
           for (int y = mesh->ystart; y <= mesh->yend; y++) {
@@ -403,10 +452,10 @@ int SNESSolver::init() {
           }
         }
 
-        d_nnz.reserve(localN);
-        d_nnz.reserve(localN);
+        d_nnz.reserve(nlocal); // One entry per local row
+        o_nnz.reserve(nlocal);
 
-        for (int i = 0; i < localN; ++i) {
+        for (int i = 0; i < nlocal; ++i) {
           //Assume all elements in the z direction are potentially coupled
           d_nnz.emplace_back(d_nnz_map3d[i].size() * mesh->LocalNz
                              + d_nnz_map2d[i].size());
@@ -417,14 +466,10 @@ int SNESSolver::init() {
 
       output_progress.write("Pre-allocating Jacobian\n");
       // Pre-allocate
-      MatMPIAIJSetPreallocation(Jmf, 0, d_nnz.data(), 0, o_nnz.data());
-      MatSeqAIJSetPreallocation(Jmf, 0, d_nnz.data());
-      MatSetUp(Jmf);
-      MatSetOption(Jmf, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE);
-
-      //  // Determine which row/columns of the matrix are locally owned
-      //  int Istart, Iend;
-      //  MatGetOwnershipRange(Jmf, &Istart, &Iend);
+      MatMPIAIJSetPreallocation(Jfd, 0, d_nnz.data(), 0, o_nnz.data());
+      MatSeqAIJSetPreallocation(Jfd, 0, d_nnz.data());
+      MatSetUp(Jfd);
+      MatSetOption(Jfd, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE);
 
       //////////////////////////////////////////////////
       // Mark non-zero entries
@@ -456,7 +501,7 @@ int SNESSolver::init() {
               // Depends on all variables on this cell
               for (int j = 0; j < n2d; j++) {
                 PetscInt col = ind2 + j;
-                ierr = MatSetValues(Jmf, 1, &row, 1, &col, &val, INSERT_VALUES);
+                ierr = MatSetValues(Jfd, 1, &row, 1, &col, &val, INSERT_VALUES);
                 CHKERRQ(ierr);
               }
             }
@@ -474,7 +519,7 @@ int SNESSolver::init() {
               // Depends on 2D fields
               for (int j = 0; j < n2d; j++) {
                 PetscInt col = ind0 + j;
-                ierr = MatSetValues(Jmf, 1, &row, 1, &col, &val, INSERT_VALUES);
+                ierr = MatSetValues(Jfd, 1, &row, 1, &col, &val, INSERT_VALUES);
                 CHKERRQ(ierr);
               }
 
@@ -500,8 +545,7 @@ int SNESSolver::init() {
                   // 3D fields on this cell
                   for (int j = 0; j < n3d; j++) {
                     PetscInt col = ind2 + j;
-                    //printf("%d %d\n",row,col);
-                    ierr = MatSetValues(Jmf, 1, &row, 1, &col, &val, INSERT_VALUES);
+                    ierr = MatSetValues(Jfd, 1, &row, 1, &col, &val, INSERT_VALUES);
 
                     if (ierr != 0) {
                       output.write("ERROR: {} {} : ({}, {}) -> ({}, {}) : {} -> {}\n",
@@ -521,8 +565,8 @@ int SNESSolver::init() {
       output_progress.write("Assembling Jacobian matrix\n");
 
       // Assemble Matrix
-      MatAssemblyBegin(Jmf, MAT_FINAL_ASSEMBLY);
-      MatAssemblyEnd(Jmf, MAT_FINAL_ASSEMBLY);
+      MatAssemblyBegin(Jfd, MAT_FINAL_ASSEMBLY);
+      MatAssemblyEnd(Jfd, MAT_FINAL_ASSEMBLY);
 
       //The above will probably miss some non-zero entries at process boundaries
       //Making sure the colouring matrix is symmetric will in some/all(?)
@@ -530,36 +574,24 @@ int SNESSolver::init() {
       if ((*options)["force_symmetric_coloring"]
               .doc("Modifies coloring matrix to force it to be symmetric")
               .withDefault<bool>(false)) {
-        Mat Jmf_T;
-        MatCreateTranspose(Jmf, &Jmf_T);
-        MatAXPY(Jmf, 1, Jmf_T, DIFFERENT_NONZERO_PATTERN);
+        Mat Jfd_T;
+        MatCreateTranspose(Jfd, &Jfd_T);
+        MatAXPY(Jfd, 1, Jfd_T, DIFFERENT_NONZERO_PATTERN);
       }
 
       output_progress.write("Creating Jacobian coloring\n");
+      updateColoring();
 
-      ISColoring iscoloring;
-
-      MatColoring coloring; // This new in PETSc 3.5
-      MatColoringCreate(Jmf, &coloring);
-      MatColoringSetType(coloring, MATCOLORINGSL);
-      MatColoringSetFromOptions(coloring);
-      // Calculate index sets
-      MatColoringApply(coloring, &iscoloring);
-      MatColoringDestroy(&coloring);
-
-      // Create data structure for SNESComputeJacobianDefaultColor
-      MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
-      // Set the function to difference
-      MatFDColoringSetFunction(
-          fdcoloring, reinterpret_cast<PetscErrorCode (*)()>(FormFunctionForColoring),
-          this);
-      MatFDColoringSetFromOptions(fdcoloring);
-      MatFDColoringSetUp(Jmf, iscoloring, fdcoloring);
-      ISColoringDestroy(&iscoloring);
-
-      SNESSetJacobian(snes, Jmf, Jmf, SNESComputeJacobianDefaultColor, fdcoloring);
+      if (prune_jacobian) {
+        // Will remove small elements from the Jacobian.
+        // Save a copy to recover from over-pruning
+        ierr = MatDuplicate(Jfd, MAT_SHARE_NONZERO_PATTERN, &Jfd_original);
+        CHKERRQ(ierr);
+      }
     } else {
       // Brute force calculation
+      // There is usually no reason to use this, except as a check of
+      // the coloring calculation.
 
       MatCreateAIJ(
           BoutComm::get(), nlocal, nlocal,  // Local sizes
@@ -567,17 +599,20 @@ int SNESSolver::init() {
           3, // Number of nonzero entries in diagonal portion of local submatrix
           nullptr,
           0, // Number of nonzeros per row in off-diagonal portion of local submatrix
-          nullptr, &Jmf);
-#if PETSC_VERSION_GE(3, 4, 0)
-      SNESSetJacobian(snes, Jmf, Jmf, SNESComputeJacobianDefault, this);
-#else
-      // Before 3.4
-      SNESSetJacobian(snes, Jmf, Jmf, SNESDefaultComputeJacobian, this);
-#endif
-      MatSetOption(Jmf, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_FALSE);
+          nullptr, &Jfd);
+
+      if (matrix_free_operator) {
+        SNESSetJacobian(snes, Jmf, Jfd, SNESComputeJacobianDefault, this);
+      } else {
+        SNESSetJacobian(snes, Jfd, Jfd, SNESComputeJacobianDefault, this);
+      }
+
+      MatSetOption(Jfd, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_FALSE);
     }
 
     // Re-use Jacobian
+    // Note: If the 'Amat' Jacobian is matrix free, SNESComputeJacobian
+    //       always updates its reference 'u' vector every nonlinear iteration
     SNESSetLagJacobian(snes, lag_jacobian);
     // Set Jacobian and preconditioner to persist across time steps
     SNESSetLagJacobianPersists(snes, PETSC_TRUE);
@@ -588,8 +623,8 @@ int SNESSolver::init() {
   // Set tolerances
   SNESSetTolerances(snes, atol, rtol, stol, maxits, PETSC_DEFAULT);
 
-// Force SNES to take at least one nonlinear iteration.
-// This may prevent the solver from getting stuck in false steady state conditions
+  // Force SNES to take at least one nonlinear iteration.
+  // This may prevent the solver from getting stuck in false steady state conditions
 #if PETSC_VERSION_GE(3, 8, 0)
   SNESSetForceIteration(snes, PETSC_TRUE);
 #endif
@@ -671,6 +706,7 @@ int SNESSolver::init() {
 
 int SNESSolver::run() {
   TRACE("SNESSolver::run()");
+  int ierr;
   // Set initial guess at the solution from variables
   {
     BoutReal* xdata = nullptr;
@@ -687,7 +723,63 @@ int SNESSolver::run() {
     bool looping = true;
     int snes_failures = 0; // Count SNES convergence failures
     int saved_jacobian_lag = 0;
+    int loop_count = 0;
     do {
+      if (scale_vars) {
+        // Individual variable scaling
+        // Note: If variables are rescaled then the Jacobian columns
+        //       need to be scaled or recalculated
+
+        if (loop_count % 100 == 0) {
+          // Rescale state (snes_x) so that all quantities are around 1
+          // If quantities are near zero then RTOL is used
+          int istart, iend;
+          VecGetOwnershipRange(snes_x, &istart, &iend);
+
+          // Take ownership of snes_x and var_scaling_factors data
+          PetscScalar* snes_x_data = nullptr;
+          ierr = VecGetArray(snes_x, &snes_x_data);
+          CHKERRQ(ierr);
+          PetscScalar* x1_data;
+          ierr = VecGetArray(x1, &x1_data);
+          CHKERRQ(ierr);
+          PetscScalar* var_scaling_factors_data;
+          ierr = VecGetArray(var_scaling_factors, &var_scaling_factors_data);
+          CHKERRQ(ierr);
+
+          // Normalise each value in the state
+          // Limit normalisation so scaling factor is never smaller than rtol
+          for (int i = 0; i < iend - istart; ++i) {
+            const PetscScalar norm =
+                BOUTMAX(std::abs(snes_x_data[i]), rtol / var_scaling_factors_data[i]);
+            snes_x_data[i] /= norm;
+            x1_data[i] /= norm; // Update history for predictor
+            var_scaling_factors_data[i] *= norm;
+          }
+
+          // Restore vector underlying data
+          ierr = VecRestoreArray(var_scaling_factors, &var_scaling_factors_data);
+          CHKERRQ(ierr);
+          ierr = VecRestoreArray(x1, &x1_data);
+          CHKERRQ(ierr);
+          ierr = VecRestoreArray(snes_x, &snes_x_data);
+          CHKERRQ(ierr);
+
+          if (diagnose) {
+            // Print maximum and minimum scaling factors
+            PetscReal max_scale, min_scale;
+            VecMax(var_scaling_factors, nullptr, &max_scale);
+            VecMin(var_scaling_factors, nullptr, &min_scale);
+            output.write("Var scaling: {} -> {}\n", min_scale, max_scale);
+          }
+
+          // Force recalculation of the Jacobian
+          SNESGetLagJacobian(snes, &saved_jacobian_lag);
+          SNESSetLagJacobian(snes, 1);
+        }
+      }
+      ++loop_count;
+
       // Copy the state (snes_x) into initial values (x0)
       VecCopy(snes_x, x0);
 
@@ -729,6 +821,13 @@ int SNESSolver::run() {
       // Find out if converged
       SNESConvergedReason reason;
       SNESGetConvergedReason(snes, &reason);
+
+      // Get number of iterations
+      int nl_its;
+      SNESGetIterationNumber(snes, &nl_its);
+      int lin_its;
+      SNESGetLinearSolveIterations(snes, &lin_its);
+
       if ((ierr != 0) or (reason < 0)) {
         // Diverged or SNES failed
 
@@ -759,6 +858,19 @@ int SNESSolver::run() {
         VecCopy(x0, snes_x);
 
         // Recalculate the Jacobian
+        if (jacobian_pruned and (snes_failures > 2) and (4 * lin_its > 3 * maxl)) {
+          // Taking 3/4 of maximum linear iterations on average per linear step
+          // May indicate a preconditioner problem.
+          // Restore pruned non-zero elements
+          if (diagnose) {
+            output.write("\nRestoring Jacobian\n");
+          }
+          ierr = MatCopy(Jfd_original, Jfd, DIFFERENT_NONZERO_PATTERN);
+          CHKERRQ(ierr);
+          // The non-zero pattern has changed, so update coloring
+          updateColoring();
+          jacobian_pruned = false; // Reset flag. Will be set after pruning.
+        }
         if (saved_jacobian_lag == 0) {
           SNESGetLagJacobian(snes, &saved_jacobian_lag);
           SNESSetLagJacobian(snes, 1);
@@ -791,16 +903,24 @@ int SNESSolver::run() {
         time1 = simtime;
       }
 
-      int nl_its;
-      SNESGetIterationNumber(snes, &nl_its);
-
       if (nl_its == 0) {
         // This can occur even with SNESSetForceIteration
         // Results in simulation state freezing and rapidly going to the end
 
-        {
+        if (scale_vars) {
+          // scaled_x <- snes_x * var_scaling_factors
+          ierr = VecPointwiseMult(scaled_x, snes_x, var_scaling_factors);
+          CHKERRQ(ierr);
+
+          const BoutReal* xdata = nullptr;
+          ierr = VecGetArrayRead(scaled_x, &xdata);
+          CHKERRQ(ierr);
+          load_vars(const_cast<BoutReal*>(xdata));
+          ierr = VecRestoreArrayRead(scaled_x, &xdata);
+          CHKERRQ(ierr);
+        } else {
           const BoutReal* xdata = nullptr;
-          int ierr = VecGetArrayRead(snes_x, &xdata);
+          ierr = VecGetArrayRead(snes_x, &xdata);
           CHKERRQ(ierr);
           load_vars(const_cast<BoutReal*>(xdata));
           ierr = VecRestoreArrayRead(snes_x, &xdata);
@@ -827,9 +947,6 @@ int SNESSolver::run() {
       if (diagnose) {
         // Gather and print diagnostic information
 
-        int lin_its;
-        SNESGetLinearSolveIterations(snes, &lin_its);
-
         output.print("\r"); // Carriage return for printing to screen
         output.write("Time: {}, timestep: {}, nl iter: {}, lin iter: {}, reason: {}",
                      simtime, timestep, nl_its, lin_its, static_cast<int>(reason));
@@ -840,6 +957,51 @@ int SNESSolver::run() {
         output.write("\n");
       }
 
+#if PETSC_VERSION_GE(3, 20, 0)
+      // MatFilter and MatEliminateZeros(Mat, bool) require PETSc >= 3.20
+      if (jacobian_recalculated and prune_jacobian) {
+        jacobian_recalculated = false; // Reset flag
+
+        // Remove small elements from the Jacobian and recompute the coloring
+        // Only do this if there are a significant number of small elements.
+        int small_elements = 0;
+        int total_elements = 0;
+
+        // Get index of rows owned by this processor
+        int rstart, rend;
+        MatGetOwnershipRange(Jfd, &rstart, &rend);
+
+        PetscInt ncols;
+        const PetscScalar* vals;
+        for (int row = rstart; row < rend; row++) {
+          MatGetRow(Jfd, row, &ncols, nullptr, &vals);
+          for (int col = 0; col < ncols; col++) {
+            if (std::abs(vals[col]) < prune_abstol) {
+              ++small_elements;
+            }
+            ++total_elements;
+          }
+          MatRestoreRow(Jfd, row, &ncols, nullptr, &vals);
+        }
+
+        if (small_elements > prune_fraction * total_elements) {
+          if (diagnose) {
+            output.write("\nPruning Jacobian elements: {} / {}\n", small_elements,
+                         total_elements);
+          }
+
+          // Prune Jacobian, keeping diagonal elements
+          ierr = MatFilter(Jfd, prune_abstol, PETSC_TRUE, PETSC_TRUE);
+
+          // Update the coloring from Jfd matrix
+          updateColoring();
+
+          // Mark the Jacobian as pruned. This is so that it is only restored if pruned.
+          jacobian_pruned = true;
+        }
+      }
+#endif // PETSC_VERSION_GE(3,20,0)
+
       if (looping) {
         if (nl_its <= lower_its) {
           // Increase timestep slightly
@@ -856,7 +1018,18 @@ int SNESSolver::run() {
     } while (looping);
 
     // Put the result into variables
-    {
+    if (scale_vars) {
+      // scaled_x <- snes_x * var_scaling_factors
+      int ierr = VecPointwiseMult(scaled_x, snes_x, var_scaling_factors);
+      CHKERRQ(ierr);
+
+      const BoutReal* xdata = nullptr;
+      ierr = VecGetArrayRead(scaled_x, &xdata);
+      CHKERRQ(ierr);
+      load_vars(const_cast<BoutReal*>(xdata));
+      ierr = VecRestoreArrayRead(scaled_x, &xdata);
+      CHKERRQ(ierr);
+    } else {
       const BoutReal* xdata = nullptr;
       int ierr = VecGetArrayRead(snes_x, &xdata);
       CHKERRQ(ierr);
@@ -877,12 +1050,27 @@ int SNESSolver::run() {
 // f = rhs
 PetscErrorCode SNESSolver::snes_function(Vec x, Vec f, bool linear) {
   // Get data from PETSc into BOUT++ fields
-  const BoutReal* xdata = nullptr;
-  int ierr = VecGetArrayRead(x, &xdata);
-  CHKERRQ(ierr);
-  load_vars(const_cast<BoutReal*>(xdata));
-  ierr = VecRestoreArrayRead(x, &xdata);
-  CHKERRQ(ierr);
+  if (scale_vars) {
+    // scaled_x <- x * var_scaling_factors
+    int ierr = VecPointwiseMult(scaled_x, x, var_scaling_factors);
+    CHKERRQ(ierr);
+
+    const BoutReal* xdata = nullptr;
+    ierr = VecGetArrayRead(scaled_x, &xdata);
+    CHKERRQ(ierr);
+    load_vars(const_cast<BoutReal*>(
+        xdata)); // const_cast needed due to load_vars API. Not writing to xdata.
+    ierr = VecRestoreArrayRead(scaled_x, &xdata);
+    CHKERRQ(ierr);
+  } else {
+    const BoutReal* xdata = nullptr;
+    int ierr = VecGetArrayRead(x, &xdata);
+    CHKERRQ(ierr);
+    load_vars(const_cast<BoutReal*>(
+        xdata)); // const_cast needed due to load_vars API. Not writing to xdata.
+    ierr = VecRestoreArrayRead(x, &xdata);
+    CHKERRQ(ierr);
+  }
 
   try {
     // Call RHS function
@@ -900,7 +1088,7 @@ PetscErrorCode SNESSolver::snes_function(Vec x, Vec f, bool linear) {
 
   // Copy derivatives back
   BoutReal* fdata = nullptr;
-  ierr = VecGetArray(f, &fdata);
+  int ierr = VecGetArray(f, &fdata);
   CHKERRQ(ierr);
   save_derivs(fdata);
   ierr = VecRestoreArray(f, &fdata);
@@ -937,6 +1125,12 @@ PetscErrorCode SNESSolver::snes_function(Vec x, Vec f, bool linear) {
   }
   };
 
+  if (scale_rhs) {
+    // f <- f * rhs_scaling_factors
+    ierr = VecPointwiseMult(f, f, rhs_scaling_factors);
+    CHKERRQ(ierr);
+  }
+
   return 0;
 }
 
@@ -983,4 +1177,133 @@ PetscErrorCode SNESSolver::precon(Vec x, Vec f) {
   return 0;
 }
 
+/// Record that the Jacobian was recalculated and, if `scale_rhs` is set,
+/// scale each row of `Jac_new` by the inverse of its largest absolute entry.
+/// The same factors are multiplied into `rhs_scaling_factors`.
+/// @param[in,out] Jac_new  Newly computed Jacobian; rows are scaled in place
+/// @return 0 on success, otherwise a PETSc error code
+/// @throws BoutException if the matrix and vector row ownership ranges differ
+PetscErrorCode SNESSolver::scaleJacobian(Mat Jac_new) {
+  jacobian_recalculated = true;
+  if (!scale_rhs) {
+    return 0; // Not scaling the RHS values
+  }
+
+  // Get index of rows owned by this processor
+  int rstart, rend;
+  int ierr = MatGetOwnershipRange(Jac_new, &rstart, &rend);
+  CHKERRQ(ierr);
+  // Check that the vector has the same ownership range
+  int istart, iend;
+  ierr = VecGetOwnershipRange(jac_row_inv_norms, &istart, &iend);
+  CHKERRQ(ierr);
+  if ((rstart != istart) or (rend != iend)) {
+    throw BoutException("Ownership ranges different: [{}, {}) and [{}, {})\n", rstart,
+                        rend, istart, iend);
+  }
+
+  // Calculate the norm of each row of the Jacobian
+  PetscScalar* row_inv_norm_data;
+  ierr = VecGetArray(jac_row_inv_norms, &row_inv_norm_data);
+  CHKERRQ(ierr);
+  PetscInt ncols;
+  const PetscScalar* vals;
+  for (int row = rstart; row < rend; ++row) {
+    ierr = MatGetRow(Jac_new, row, &ncols, nullptr, &vals);
+    CHKERRQ(ierr);
+    // Calculate a norm of this row of the Jacobian (maximum absolute value)
+    PetscScalar norm = 0.0;
+    for (int col = 0; col < ncols; col++) {
+      PetscScalar absval = std::abs(vals[col]);
+      if (absval > norm) {
+        norm = absval;
+      }
+      // Can we identify small elements and remove them?
+      // so we don't need to calculate them next time
+    }
+    // Store in the vector as 1 / norm. A row with no non-zero entries is left
+    // unscaled: 1 / 0 would put inf in the scaling factors (and NaN from 0 * inf).
+    row_inv_norm_data[row - rstart] = (norm > 0.0) ? 1. / norm : 1.0;
+    ierr = MatRestoreRow(Jac_new, row, &ncols, nullptr, &vals);
+    CHKERRQ(ierr);
+  }
+  ierr = VecRestoreArray(jac_row_inv_norms, &row_inv_norm_data);
+  CHKERRQ(ierr);
+
+  // Modify the RHS scaling: factor = factor / norm
+  ierr = VecPointwiseMult(rhs_scaling_factors, rhs_scaling_factors, jac_row_inv_norms);
+  CHKERRQ(ierr);
+  if (diagnose) {
+    // Print maximum and minimum scaling factors
+    PetscReal max_scale, min_scale;
+    VecMax(rhs_scaling_factors, nullptr, &max_scale);
+    VecMin(rhs_scaling_factors, nullptr, &min_scale);
+    output.write("RHS scaling: {} -> {}\n", min_scale, max_scale);
+  }
+
+  // Scale the Jacobian rows by multiplying on the left by 1/norm
+  ierr = MatDiagonalScale(Jac_new, jac_row_inv_norms, nullptr);
+  CHKERRQ(ierr);
+  return 0;
+}
+
+/// Jacobian callback for SNES: computes the Jacobian by coloured finite
+/// differences with SNESComputeJacobianDefaultColor, then passes the new
+/// matrix to SNESSolver::scaleJacobian.
+///
+/// Input Parameters:
+///   snes - nonlinear solver object
+///   x1 - location at which to evaluate Jacobian
+///   ctx - MatFDColoring context or NULL (if NULL, scaleJacobian is not called)
+///
+/// Output Parameters:
+///   Jac - Jacobian matrix (not altered in this routine)
+///   Jac_new - newly computed Jacobian matrix to use with preconditioner
+///   (generally the same as Jac)
+static PetscErrorCode ComputeJacobianScaledColor(SNES snes, Vec x1, Mat Jac, Mat Jac_new,
+                                                 void* ctx) {
+  PetscErrorCode err = SNESComputeJacobianDefaultColor(snes, x1, Jac, Jac_new, ctx);
+  CHKERRQ(err); // Returns here on failure, so err is zero below
+  if (ctx == nullptr) {
+    return 0;
+  }
+  // Get the SNESSolver pointer from the function call context
+  void* solver_ctx = nullptr;
+  err = MatFDColoringGetFunction(static_cast<MatFDColoring>(ctx), nullptr, &solver_ctx);
+  CHKERRQ(err);
+  auto* solver = static_cast<SNESSolver*>(solver_ctx);
+  // Call the SNESSolver function; nothing to scale if no solver was registered
+  return (solver != nullptr) ? solver->scaleJacobian(Jac_new) : 0;
+}
+
+/// Recompute the finite-difference coloring from the current non-zero
+/// pattern of Jfd, replacing any existing `fdcoloring`, and register the
+/// new coloring as the context of the SNES Jacobian function.
+void SNESSolver::updateColoring() {
+  // Color the matrix; the coloring type may be changed through PETSc options
+  MatColoring mat_coloring = nullptr;
+  MatColoringCreate(Jfd, &mat_coloring);
+  MatColoringSetType(mat_coloring, MATCOLORINGSL);
+  MatColoringSetFromOptions(mat_coloring);
+
+  // Calculate new index sets
+  ISColoring index_sets = nullptr;
+  MatColoringApply(mat_coloring, &index_sets);
+  MatColoringDestroy(&mat_coloring);
+
+  // Swap the old finite-difference coloring for one built on the new index sets
+  MatFDColoringDestroy(&fdcoloring);
+  MatFDColoringCreate(Jfd, index_sets, &fdcoloring);
+  MatFDColoringSetFunction(
+      fdcoloring, reinterpret_cast<PetscErrorCode (*)()>(FormFunctionForColoring), this);
+  MatFDColoringSetFromOptions(fdcoloring);
+  MatFDColoringSetUp(Jfd, index_sets, fdcoloring);
+  ISColoringDestroy(&index_sets);
+
+  // Replace the CTX pointer in SNES Jacobian. The operator is matrix-free (Jmf)
+  // if matrix_free_operator is set; the preconditioner always uses Jfd.
+  Mat jac_operator = matrix_free_operator ? Jmf : Jfd;
+  SNESSetJacobian(snes, jac_operator, Jfd, ComputeJacobianScaledColor, fdcoloring);
+}
+
 #endif // BOUT_HAS_PETSC

From aed011fd2d65db38992b3e59ac7ccf61f16e51b7 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Thu, 24 Apr 2025 15:53:26 -0700
Subject: [PATCH 038/129] beuler: Limit stencil to fit in guard cells

If the stencil offset exceeds MXG in X, or MYG in Y, then
the index offsets will go outside the range of the guard cells.

Fixes failure of test-beuler
---
 src/solver/impls/snes/snes.cxx | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 61d98adafc..024d5fbd08 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -6,6 +6,7 @@
 
 #include <bout/boutcomm.hxx>
 #include <bout/boutexception.hxx>
+#include <bout/globals.hxx>
 #include <bout/msg_stack.hxx>
 #include <bout/utils.hxx>
 
@@ -44,8 +45,11 @@ class ColoringStencil {
     };
     std::vector<std::pair<int, int>> xy_offsets;
     auto loop_bound = std::max({n_square, n_taxi, n_cross});
-    for (int i = -loop_bound; i <= loop_bound; ++i) {
-      for (int j = -loop_bound; j <= loop_bound; ++j) {
+    // Ensure that stencil does not go beyond guard cells
+    auto loop_bound_x = std::min({loop_bound, bout::globals::mesh->xstart});
+    auto loop_bound_y = std::min({loop_bound, bout::globals::mesh->ystart});
+    for (int i = -loop_bound_x; i <= loop_bound_x; ++i) {
+      for (int j = -loop_bound_y; j <= loop_bound_y; ++j) {
         if (inside(i, j)) {
           xy_offsets.emplace_back(i, j);
         }

From c94150e35d689bddf92e6f3f43162e5dcd35e161 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Thu, 24 Apr 2025 16:19:38 -0700
Subject: [PATCH 039/129] beuler: Fix limits on indices

Revert earlier change to offset array. Instead fix index limits
to be < LocalNx.
---
 src/solver/impls/snes/snes.cxx | 57 ++++++++++++++++------------------
 1 file changed, 26 insertions(+), 31 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 024d5fbd08..90e7c5085a 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -45,11 +45,8 @@ class ColoringStencil {
     };
     std::vector<std::pair<int, int>> xy_offsets;
     auto loop_bound = std::max({n_square, n_taxi, n_cross});
-    // Ensure that stencil does not go beyond guard cells
-    auto loop_bound_x = std::min({loop_bound, bout::globals::mesh->xstart});
-    auto loop_bound_y = std::min({loop_bound, bout::globals::mesh->ystart});
-    for (int i = -loop_bound_x; i <= loop_bound_x; ++i) {
-      for (int j = -loop_bound_y; j <= loop_bound_y; ++j) {
+    for (int i = -loop_bound; i <= loop_bound; ++i) {
+      for (int j = -loop_bound; j <= loop_bound; ++j) {
         if (inside(i, j)) {
           xy_offsets.emplace_back(i, j);
         }
@@ -320,8 +317,8 @@ int SNESSolver::init() {
 
       output_progress.write("Setting Jacobian matrix sizes\n");
 
-      int n2d = f2d.size();
-      int n3d = f3d.size();
+      const int n2d = f2d.size();
+      const int n3d = f3d.size();
 
       // Set size of Matrix on each processor to nlocal x nlocal
       MatCreate(BoutComm::get(), &Jfd);
@@ -359,40 +356,39 @@ int SNESSolver::init() {
 
       auto const xy_offsets = ColoringStencil::getOffsets(n_square, n_taxi, n_cross);
       {
-        //This is ugly but can't think of a better and robust way to
-        //count the non-zeros for some arbitery stencil
-        //effectivly the same loop as the one that sets the non-zeros below
+        // This is ugly but can't think of a better and robust way to
+        // count the non-zeros for some arbitrary stencil
+        // effectively the same loop as the one that sets the non-zeros below
         std::vector<std::set<int>> d_nnz_map2d(nlocal);
         std::vector<std::set<int>> o_nnz_map2d(nlocal);
         std::vector<std::set<int>> d_nnz_map3d(nlocal);
         std::vector<std::set<int>> o_nnz_map3d(nlocal);
-        //Loop over every element in 2D to count the *unique* non-zeros
+        // Loop over every element in 2D to count the *unique* non-zeros
         for (int x = mesh->xstart; x <= mesh->xend; x++) {
           for (int y = mesh->ystart; y <= mesh->yend; y++) {
 
-            int ind0 = ROUND(index(x, y, 0)) - Istart;
+            const int ind0 = ROUND(index(x, y, 0)) - Istart;
 
             // 2D fields
             for (int i = 0; i < n2d; i++) {
-              PetscInt row = ind0 + i;
-              //if (row < Istart || row >= Iend) continue;
+              const PetscInt row = ind0 + i;
               // Loop through each point in the stencil
               for (const auto& [x_off, y_off] : xy_offsets) {
-                int xi = x + x_off;
-                int yi = y + y_off;
+                const int xi = x + x_off;
+                const int yi = y + y_off;
                 if ((xi < 0) || (yi < 0) || (xi >= mesh->LocalNx)
                     || (yi >= mesh->LocalNy)) {
                   continue;
                 }
 
-                int ind2 = ROUND(index(xi, yi, 0));
+                const int ind2 = ROUND(index(xi, yi, 0));
                 if (ind2 < 0) {
                   continue; // A boundary point
                 }
 
                 // Depends on all variables on this cell
                 for (int j = 0; j < n2d; j++) {
-                  PetscInt col = ind2 + j;
+                  const PetscInt col = ind2 + j;
                   if (col >= Istart && col < Iend) {
                     d_nnz_map2d[row].insert(col);
                   } else {
@@ -403,18 +399,17 @@ int SNESSolver::init() {
             }
             // 3D fields
             for (int z = 0; z < mesh->LocalNz; z++) {
-              int ind = ROUND(index(x, y, z)) - Istart;
+              const int ind = ROUND(index(x, y, z)) - Istart;
 
               for (int i = 0; i < n3d; i++) {
                 PetscInt row = ind + i;
-                //if (row < Istart || row >= Iend) continue;
                 if (z == 0) {
                   row += n2d;
                 }
 
                 // Depends on 2D fields
                 for (int j = 0; j < n2d; j++) {
-                  PetscInt col = ind0 + j;
+                  const PetscInt col = ind0 + j;
                   if (col >= Istart && col < Iend) {
                     d_nnz_map2d[row].insert(col);
                   } else {
@@ -424,11 +419,11 @@ int SNESSolver::init() {
 
                 // Star pattern
                 for (const auto& [x_off, y_off] : xy_offsets) {
-                  int xi = x + x_off;
-                  int yi = y + y_off;
+                  const int xi = x + x_off;
+                  const int yi = y + y_off;
 
-                  if ((xi < 0) || (yi < 0) || (xi > mesh->LocalNx)
-                      || (yi > mesh->LocalNy)) {
+                  if ((xi < 0) || (yi < 0) || (xi >= mesh->LocalNx)
+                      || (yi >= mesh->LocalNy)) {
                     continue;
                   }
 
@@ -443,7 +438,7 @@ int SNESSolver::init() {
 
                   // 3D fields on this cell
                   for (int j = 0; j < n3d; j++) {
-                    PetscInt col = ind2 + j;
+                    const PetscInt col = ind2 + j;
                     if (col >= Istart && col < Iend) {
                       d_nnz_map3d[row].insert(col);
                     } else {
@@ -483,17 +478,17 @@ int SNESSolver::init() {
       for (int x = mesh->xstart; x <= mesh->xend; x++) {
         for (int y = mesh->ystart; y <= mesh->yend; y++) {
 
-          int ind0 = ROUND(index(x, y, 0));
+          const int ind0 = ROUND(index(x, y, 0));
 
           // 2D fields
           for (int i = 0; i < n2d; i++) {
-            PetscInt row = ind0 + i;
+            const PetscInt row = ind0 + i;
 
             // Loop through each point in the stencil
             for (const auto& [x_off, y_off] : xy_offsets) {
-              int xi = x + x_off;
-              int yi = y + y_off;
-              if ((xi < 0) || (yi < 0) || (xi > mesh->LocalNx) || (yi > mesh->LocalNy)) {
+              const int xi = x + x_off;
+              const int yi = y + y_off;
+              if ((xi < 0) || (yi < 0) || (xi >= mesh->LocalNx) || (yi >= mesh->LocalNy)) {
                 continue;
               }
 

From 56298f02cc8709efe8106a98db14e335456dc2cf Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Thu, 24 Apr 2025 16:51:41 -0700
Subject: [PATCH 040/129] beuler: Apply clang-format

---
 src/solver/impls/snes/snes.cxx | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 90e7c5085a..a7f2d36d8a 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -488,7 +488,8 @@ int SNESSolver::init() {
             for (const auto& [x_off, y_off] : xy_offsets) {
               const int xi = x + x_off;
               const int yi = y + y_off;
-              if ((xi < 0) || (yi < 0) || (xi >= mesh->LocalNx) || (yi >= mesh->LocalNy)) {
+              if ((xi < 0) || (yi < 0) || (xi >= mesh->LocalNx)
+                  || (yi >= mesh->LocalNy)) {
                 continue;
               }
 

From 348e65b9e2a09e2090cf209cc0eca07a4b1cfd40 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Sat, 26 Apr 2025 14:21:43 -0700
Subject: [PATCH 041/129] beuler: Disable matrix_free_operator by default

The matrix_free_operator option uses a matrix-free method to calculate
Jacobian-vector products. It seems to improve performance in 1D, but
degrades performance in 2D. The effect is likely problem-dependent, so
the option is now off by default.
---
 src/solver/impls/snes/snes.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index a7f2d36d8a..4dce1e7086 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -160,7 +160,7 @@ SNESSolver::SNESSolver(Options* opts)
                       .withDefault<bool>(false)),
       matrix_free_operator((*options)["matrix_free_operator"]
                                .doc("Use matrix free Jacobian-vector operator?")
-                               .withDefault<bool>(true)),
+                               .withDefault<bool>(false)),
       lag_jacobian((*options)["lag_jacobian"]
                        .doc("Re-use the Jacobian this number of SNES iterations")
                        .withDefault(50)),

From ea7695a48de5a1268fa54780c592b01be0271705 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Sat, 26 Apr 2025 22:37:52 -0700
Subject: [PATCH 042/129] snes: Add documentation to manual

Using @seimtpow's PR comments to add material to the manual.
---
 manual/sphinx/user_docs/time_integration.rst | 58 +++++++++++++++++++-
 1 file changed, 56 insertions(+), 2 deletions(-)

diff --git a/manual/sphinx/user_docs/time_integration.rst b/manual/sphinx/user_docs/time_integration.rst
index 7d0b56abcc..a4db823369 100644
--- a/manual/sphinx/user_docs/time_integration.rst
+++ b/manual/sphinx/user_docs/time_integration.rst
@@ -393,7 +393,9 @@ iterations within a given range.
 +---------------------------+---------------+----------------------------------------------------+
 | predictor                 | true          | Use linear predictor?                              |
 +---------------------------+---------------+----------------------------------------------------+
-| matrix_free               | false         | Use matrix free Jacobian-vector product?           |
+| matrix_free               | false         | Matrix-free preconditioning?                       |
++---------------------------+---------------+----------------------------------------------------+
+| matrix_free_operator      | false         | Use matrix free Jacobian-vector product?           |
 +---------------------------+---------------+----------------------------------------------------+
 | use_coloring              | true          | If ``matrix_free=false``, use coloring to speed up |
 |                           |               | calculation of the Jacobian elements.              |
@@ -402,11 +404,18 @@ iterations within a given range.
 +---------------------------+---------------+----------------------------------------------------+
 | kspsetinitialguessnonzero | false         | If true, Use previous solution as KSP initial      |
 +---------------------------+---------------+----------------------------------------------------+
-| use_precon                | false         | Use user-supplied preconditioner?                  |
+| use_precon                | false         | If ``matrix_free=true``, use user-supplied         |
+|                           |               | preconditioner?                                    |
 |                           |               | If false, the default PETSc preconditioner is used |
 +---------------------------+---------------+----------------------------------------------------+
 | diagnose                  | false         | Print diagnostic information every iteration       |
 +---------------------------+---------------+----------------------------------------------------+
+| stencil:cross             | 0             | If ``matrix_free=false`` and ``use_coloring=true`` |
+| stencil:square            | 0             | Set the size and shape of the Jacobian coloring    |
+| stencil:taxi              | 2             | stencil.                                           |
++---------------------------+---------------+----------------------------------------------------+
+| force_symmetric_coloring  | false         | Ensure that the Jacobian coloring is symmetric     |
++---------------------------+---------------+----------------------------------------------------+
 
 The predictor is linear extrapolation from the last two timesteps. It seems to be
 effective, but can be disabled by setting ``predictor = false``.
@@ -444,6 +453,51 @@ Preconditioner types:
    Enable with command-line args ``-pc_type hypre -pc_hypre_type euclid -pc_hypre_euclid_levels k``
    where ``k`` is the level (1-8 typically).
 
+Jacobian coloring stencil
+~~~~~~~~~~~~~~~~~~~~~~~~~
+
+The stencil used to create the Jacobian colouring can be varied,
+depending on which numerical operators are in use.
+
+
+``solver:stencil:cross = N``
+e.g. for N == 2
+
+.. code-block:: bash
+
+        *
+        *
+    * * x * *
+        *
+        *
+
+
+``solver:stencil:square = N``
+e.g. for N == 2
+
+.. code-block:: bash
+
+    * * * * *
+    * * * * *
+    * * x * *
+    * * * * *
+    * * * * *
+
+``solver:stencil:taxi = N``
+e.g. for N == 2
+
+.. code-block:: bash
+
+        *
+      * * *
+    * * x * *
+      * * *
+        *
+
+Setting ``solver:force_symmetric_coloring = true`` will make sure
+that the Jacobian colouring matrix is symmetric.  This will often
+include a few extra non-zeros that the stencil would otherwise miss.
+
 ODE integration
 ---------------
 

From 9fba0611fac9c6596c643dd2c49904ef4c4dfbd4 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Mon, 28 Apr 2025 13:17:52 +0100
Subject: [PATCH 043/129] Add
 TokamakOptions::CylindricalCoordinatesToCartesian()

method for converting to cartesian coordinates from cylindrical coordinates.

Add new struct Coordinates3D, to encapsulate (x,y,z) coordinates.
---
 include/bout/tokamak_coordinates.hxx | 12 ++++++++++++
 src/mesh/tokamak_coordinates.cxx     |  9 ++++++++-
 2 files changed, 20 insertions(+), 1 deletion(-)

diff --git a/include/bout/tokamak_coordinates.hxx b/include/bout/tokamak_coordinates.hxx
index f13e718787..4b89d3a4ce 100644
--- a/include/bout/tokamak_coordinates.hxx
+++ b/include/bout/tokamak_coordinates.hxx
@@ -11,8 +11,18 @@ using FieldMetric = MetricTensor::FieldMetric;
 
 namespace bout {
 
+    struct Coordinates3D {
+
+        Field3D x;
+        Field3D y;
+        Field3D z;
+
+        Coordinates3D(Field3D x, Field3D y, Field3D z) : x(x), y(y), z(z) {}
+    };
+
     struct TokamakOptions {
         Field2D Rxy;
+        Field2D Zxy;
         Field2D Bpxy;
         Field2D Btxy;
         Field2D Bxy;
@@ -23,6 +33,8 @@ namespace bout {
         TokamakOptions(Mesh &mesh);
 
         void normalise(BoutReal Lbar, BoutReal Bbar, BoutReal ShearFactor);
+
+        Coordinates3D CylindricalCoordinatesToCartesian();
     };
 
     BoutReal get_sign_of_bp(const Field2D &Bpxy);
diff --git a/src/mesh/tokamak_coordinates.cxx b/src/mesh/tokamak_coordinates.cxx
index e5a7636b7d..854ebc7982 100644
--- a/src/mesh/tokamak_coordinates.cxx
+++ b/src/mesh/tokamak_coordinates.cxx
@@ -17,7 +17,7 @@ namespace bout {
 
     TokamakOptions::TokamakOptions(Mesh &mesh) {
         mesh.get(Rxy, "Rxy");
-        //    mesh->get(Zxy, "Zxy");
+        mesh.get(Zxy, "Zxy");
         mesh.get(Bpxy, "Bpxy");
         mesh.get(Btxy, "Btxy");
         mesh.get(Bxy, "Bxy");
@@ -28,6 +28,13 @@ namespace bout {
         }
     }
 
+    Coordinates3D TokamakOptions::CylindricalCoordinatesToCartesian() {
+        Field3D x = Rxy * cos(Zxy);
+        Field3D y = Rxy * sin(Zxy);
+        Field3D z = Rxy * sin(Zxy);
+        return Coordinates3D(x, y, z);
+    }
+
     void TokamakOptions::normalise(BoutReal Lbar, BoutReal Bbar, BoutReal ShearFactor) {
         Rxy /= Lbar;
         Bpxy /= Bbar;

From 4c50b3da8460837e46b4433359e692413b8c4756 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Mon, 28 Apr 2025 15:00:12 +0100
Subject: [PATCH 044/129] Add test fixture CoordinateTransformTest, and test
 CylindricalToCartesian

---
 tests/unit/CMakeLists.txt                     |  1 +
 .../mesh/test_change_coordinate_system.cxx    | 47 +++++++++++++++++++
 2 files changed, 48 insertions(+)
 create mode 100644 tests/unit/mesh/test_change_coordinate_system.cxx

diff --git a/tests/unit/CMakeLists.txt b/tests/unit/CMakeLists.txt
index 47253c508f..e76a15dd57 100644
--- a/tests/unit/CMakeLists.txt
+++ b/tests/unit/CMakeLists.txt
@@ -67,6 +67,7 @@ set(serial_tests_source
   ./mesh/test_boundary_factory.cxx
   ./mesh/test_boutmesh.cxx
   ./mesh/test_coordinates.cxx
+  ./mesh/test_change_coordinate_system.cxx
   ./mesh/test_coordinates_accessor.cxx
   ./mesh/test_interpolation.cxx
   ./mesh/test_invert3x3.cxx
diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
new file mode 100644
index 0000000000..f96e545fd7
--- /dev/null
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -0,0 +1,47 @@
+#include "gtest/gtest.h"
+#include "bout/coordinates.hxx"
+#include "bout/mesh.hxx"
+#include "fake_mesh_fixture.hxx"
+#include <bout/tokamak_coordinates.hxx>
+
+
+using bout::globals::mesh;
+
+class CoordinateTransformTest : public FakeMeshFixture {
+public:
+    using FieldMetric = Coordinates::FieldMetric;
+
+    CoordinateTransformTest() : FakeMeshFixture() {}
+};
+
+TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
+
+    auto tokamak_options = bout::TokamakOptions(*mesh);
+
+    for (int i = 0; i < tokamak_options.Rxy.getNx(); i++) {
+        for (int j = 0; j < tokamak_options.Rxy.getNy(); j++) {
+            tokamak_options.Rxy(i, j) = ((float) i + 1) / 1000 * ((float) j + 1) / 1000;
+        }
+    }
+
+    bout::Coordinates3D cartesian_coords = tokamak_options.CylindricalCoordinatesToCartesian();
+
+    for (int jx = 0; jx < mesh->xstart; jx++) {
+        for (int jy = 0; jy < mesh->ystart; jy++) {
+            for (int jz = 0; jz < mesh->LocalNz; jz++) {
+
+                auto actual_x = cartesian_coords.x(jx, jy, jz);
+                auto actual_y = cartesian_coords.y(jx, jy, jz);
+                auto actual_z = cartesian_coords.z(jx, jy, jz);
+
+                auto expected_x = tokamak_options.Rxy(jx, jy) * cos(tokamak_options.toroidal_angle(jx, jy, jz));
+                auto expected_y = tokamak_options.Rxy(jx, jy) * sin(tokamak_options.toroidal_angle(jx, jy, jz));
+                auto expected_z = tokamak_options.Zxy(jx, jy);
+
+                EXPECT_EQ(actual_x, expected_x);
+                EXPECT_EQ(actual_y, expected_y);
+                EXPECT_EQ(actual_z, expected_z);
+            }
+        }
+    }
+}

From a63f7d6c96b1cd9cc8d950d78bcb246bef98f27e Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Mon, 28 Apr 2025 17:08:44 +0100
Subject: [PATCH 045/129] Fix CylindricalCoordinatesToCartesian()

Add toroidal_angle field to TokamakOptions.
Iterate over all coordinate points.
---
 include/bout/tokamak_coordinates.hxx |  1 +
 src/mesh/tokamak_coordinates.cxx     | 16 +++++++++++++---
 2 files changed, 14 insertions(+), 3 deletions(-)

diff --git a/include/bout/tokamak_coordinates.hxx b/include/bout/tokamak_coordinates.hxx
index 4b89d3a4ce..f75825ad3a 100644
--- a/include/bout/tokamak_coordinates.hxx
+++ b/include/bout/tokamak_coordinates.hxx
@@ -29,6 +29,7 @@ namespace bout {
         Field2D hthe;
         FieldMetric I;
         FieldMetric dx;
+        FieldMetric toroidal_angle;
 
         TokamakOptions(Mesh &mesh);
 
diff --git a/src/mesh/tokamak_coordinates.cxx b/src/mesh/tokamak_coordinates.cxx
index 854ebc7982..0ac5db1a2b 100644
--- a/src/mesh/tokamak_coordinates.cxx
+++ b/src/mesh/tokamak_coordinates.cxx
@@ -26,12 +26,22 @@ namespace bout {
         if (mesh.get(dx, "dpsi")) {
             dx = mesh.getCoordinates()->dx();
         }
+        mesh.get(toroidal_angle, "z");
     }
 
     Coordinates3D TokamakOptions::CylindricalCoordinatesToCartesian() {
-        Field3D x = Rxy * cos(Zxy);
-        Field3D y = Rxy * sin(Zxy);
-        Field3D z = Rxy * sin(Zxy);
+        Field3D x = emptyFrom(Rxy);
+        Field3D y = emptyFrom(Rxy);
+        Field3D z = emptyFrom(Zxy);
+        for (int i = 0; i < toroidal_angle.getNx(); i++) {
+            for (int j = 0; j < toroidal_angle.getNy(); j++) {
+                for (int k = 0; k < toroidal_angle.getNz(); k++) {
+                    x(i, j, k) = Rxy(i, j) * cos(toroidal_angle(i, j, k));
+                    y(i, j, k) = Rxy(i, j) * sin(toroidal_angle(i, j, k));
+                    z(i, j, k) = Zxy(i, j);
+                }
+            }
+        }
         return Coordinates3D(x, y, z);
     }
 

From 71f9429f2e55f35e57baceaf1c096dbcf272c1ae Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Mon, 28 Apr 2025 17:26:52 +0100
Subject: [PATCH 046/129] Fix test CylindricalToCartesian

---
 tests/unit/mesh/test_change_coordinate_system.cxx | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index f96e545fd7..f6075e5485 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -26,8 +26,8 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
     bout::Coordinates3D cartesian_coords = tokamak_options.CylindricalCoordinatesToCartesian();
 
-    for (int jx = 0; jx < mesh->xstart; jx++) {
-        for (int jy = 0; jy < mesh->ystart; jy++) {
+    for (int jx = 0; jx < mesh->xend; jx++) {
+        for (int jy = 0; jy < mesh->yend; jy++) {
             for (int jz = 0; jz < mesh->LocalNz; jz++) {
 
                 auto actual_x = cartesian_coords.x(jx, jy, jz);

From 06df2d62bd0df9a813732622a4471a29407d2725 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Mon, 28 Apr 2025 17:55:43 +0100
Subject: [PATCH 047/129] Calculate toroidal angle, as 2*pi/n

---
 src/mesh/tokamak_coordinates.cxx | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/src/mesh/tokamak_coordinates.cxx b/src/mesh/tokamak_coordinates.cxx
index 0ac5db1a2b..8161acb34a 100644
--- a/src/mesh/tokamak_coordinates.cxx
+++ b/src/mesh/tokamak_coordinates.cxx
@@ -4,6 +4,7 @@
 #include "bout/bout_types.hxx"
 #include "bout/field2d.hxx"
 #include "bout/utils.hxx"
+#include "bout/constants.hxx"
 
 
 namespace bout {
@@ -26,7 +27,8 @@ namespace bout {
         if (mesh.get(dx, "dpsi")) {
             dx = mesh.getCoordinates()->dx();
         }
-        mesh.get(toroidal_angle, "z");
+//        mesh.get(toroidal_angle, "z");
+        toroidal_angle = 2 * PI / Rxy.size();
     }
 
     Coordinates3D TokamakOptions::CylindricalCoordinatesToCartesian() {

From 0ced35ef3c911b77a77e9d1ca0247bdc28ebc30e Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Fri, 2 May 2025 21:10:28 -0700
Subject: [PATCH 048/129] beuler: Add output interpolation

The preconditioner depends on the timestep, so avoid changing
timestep unless necessary. Allow timesteps to go past output time,
then interpolate.

If timesteps are adjusted then recalculate the Jacobian. This
could be optimised to update the Jacobian and recalculate the
preconditioner, without finite differencing the RHS.
---
 src/solver/impls/snes/snes.cxx | 96 ++++++++++++++++++++++++++++------
 src/solver/impls/snes/snes.hxx | 17 +++---
 2 files changed, 89 insertions(+), 24 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 4dce1e7086..0e514d56cc 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -297,13 +297,21 @@ int SNESSolver::init() {
     SNESSetJacobian(snes, Jmf, Jmf, MatMFFDComputeJacobian, this);
 
   } else {
-    // Calculate the Jacobian using finite differences.
-    // The finite difference Jacobian (Jfd) may be used for both operator
-    // and preconditioner or, if matrix_free_operator, in only the preconditioner.
+    // Calculate the Jacobian using finite differences.  The finite
+    // difference Jacobian (Jfd) may be used for both operator and
+    // preconditioner or, if matrix_free_operator, in only the
+    // preconditioner.
+
+    // Create a vector to store interpolated output solution
+    // Used so that the timestep does not have to be adjusted,
+    // because that would require updating the preconditioner.
+    ierr = VecDuplicate(snes_x, &output_x);
+    CHKERRQ(ierr);
+
     if (use_coloring) {
-      // Use matrix coloring
-      // This greatly reduces the number of times the rhs() function needs
-      // to be evaluated when calculating the Jacobian.
+      // Use matrix coloring.
+      // This greatly reduces the number of times the rhs() function
+      // needs to be evaluated when calculating the Jacobian.
 
       // Use global mesh for now
       Mesh* mesh = bout::globals::mesh;
@@ -717,14 +725,17 @@ int SNESSolver::run() {
     CHKERRQ(ierr);
   }
 
+  BoutReal target = simtime;
   for (int s = 0; s < getNumberOutputSteps(); s++) {
-    BoutReal target = simtime + getOutputTimestep();
+    target += getOutputTimestep();
 
     bool looping = true;
     int snes_failures = 0; // Count SNES convergence failures
     int saved_jacobian_lag = 0;
     int loop_count = 0;
     do {
+      if (simtime >= target)
+        break; // Could happen if step over multiple outputs
       if (scale_vars) {
         // Individual variable scaling
         // Note: If variables are rescaled then the Jacobian columns
@@ -802,9 +813,15 @@ int SNESSolver::run() {
       dt = timestep;
       looping = true;
       if (simtime + dt >= target) {
-        // Ensure that the timestep goes to the next output time and then stops
+        // Note: When the timestep is changed the preconditioner needs to be updated
+        // => Step over the output time and interpolate if not matrix free
+
+        if (matrix_free) {
+          // Ensure that the timestep goes to the next output time and then stops.
+          // This avoids the need to interpolate
+          dt = target - simtime;
+        }
         looping = false;
-        dt = target - simtime;
       }
 
       if (predictor and (time1 > 0.0)) {
@@ -872,6 +889,7 @@ int SNESSolver::run() {
           jacobian_pruned = false; // Reset flag. Will be set after pruning.
         }
         if (saved_jacobian_lag == 0) {
+          // This triggers a Jacobian recalculation
           SNESGetLagJacobian(snes, &saved_jacobian_lag);
           SNESSetLagJacobian(snes, 1);
         }
@@ -1003,24 +1021,70 @@ int SNESSolver::run() {
 #endif // PETSC_VERSION_GE(3,20,0)
 
       if (looping) {
-        if (nl_its <= lower_its) {
+        // Consider changing the timestep.
+        // Note: The preconditioner depends on the timestep,
+        // so if it is not recalculated the it will be less
+        // effective.
+        if ((nl_its <= lower_its) && (timestep < max_timestep)) {
           // Increase timestep slightly
           timestep *= 1.1;
 
           if (timestep > max_timestep) {
             timestep = max_timestep;
           }
+
+          // Note: Setting the SNESJacobianFn to NULL retains
+          // previously set evaluation function.
+          //
+          // The SNES Jacobian is a combination of the RHS Jacobian
+          // and a factor involving the timestep.
+          // Depends on equation_form
+          // -> Probably call SNESSetJacobian(snes, Jfd, Jfd, NULL, fdcoloring);
+
+          // Recompute Jacobian (for now)
+          if (saved_jacobian_lag == 0) {
+            SNESGetLagJacobian(snes, &saved_jacobian_lag);
+            SNESSetLagJacobian(snes, 1);
+          }
+
         } else if (nl_its >= upper_its) {
           // Reduce timestep slightly
           timestep *= 0.9;
+
+          // Recompute Jacobian
+          if (saved_jacobian_lag == 0) {
+            SNESGetLagJacobian(snes, &saved_jacobian_lag);
+            SNESSetLagJacobian(snes, 1);
+          }
         }
       }
     } while (looping);
 
+    if (!matrix_free) {
+      ASSERT2(simtime >= target);
+      ASSERT2(simtime - dt < target);
+      // Stepped over output timestep => Interpolate
+      // snes_x is the solution at t = simtime
+      // x0 is the solution at t = simtime - dt
+      // Calculate output_x at t = target
+      VecCopy(snes_x, output_x);
+
+      // Note: If simtime = target then alpha = 0
+      //       and output_x = snes_x
+      BoutReal alpha = (simtime - target) / dt;
+
+      // output_x <- alpha * x0 + (1 - alpha) * output_x
+      VecAXPBY(output_x, alpha, 1. - alpha, x0);
+
+    } else {
+      // Timestep was adjusted to hit target output time
+      output_x = snes_x;
+    }
+
     // Put the result into variables
     if (scale_vars) {
-      // scaled_x <- snes_x * var_scaling_factors
-      int ierr = VecPointwiseMult(scaled_x, snes_x, var_scaling_factors);
+      // scaled_x <- output_x * var_scaling_factors
+      int ierr = VecPointwiseMult(scaled_x, output_x, var_scaling_factors);
       CHKERRQ(ierr);
 
       const BoutReal* xdata = nullptr;
@@ -1031,15 +1095,15 @@ int SNESSolver::run() {
       CHKERRQ(ierr);
     } else {
       const BoutReal* xdata = nullptr;
-      int ierr = VecGetArrayRead(snes_x, &xdata);
+      int ierr = VecGetArrayRead(output_x, &xdata);
       CHKERRQ(ierr);
       load_vars(const_cast<BoutReal*>(xdata));
-      ierr = VecRestoreArrayRead(snes_x, &xdata);
+      ierr = VecRestoreArrayRead(output_x, &xdata);
       CHKERRQ(ierr);
     }
-    run_rhs(simtime); // Run RHS to calculate auxilliary variables
+    run_rhs(target); // Run RHS to calculate auxilliary variables
 
-    if (call_monitors(simtime, s, getNumberOutputSteps()) != 0) {
+    if (call_monitors(target, s, getNumberOutputSteps()) != 0) {
       break; // User signalled to quit
     }
   }
diff --git a/src/solver/impls/snes/snes.hxx b/src/solver/impls/snes/snes.hxx
index 17050ad775..187a64fb40 100644
--- a/src/solver/impls/snes/snes.hxx
+++ b/src/solver/impls/snes/snes.hxx
@@ -4,7 +4,7 @@
  * using PETSc for the SNES interface
  *
  **************************************************************************
- * Copyright 2015-2024 BOUT++ contributors
+ * Copyright 2015-2025 BOUT++ contributors
  *
  * Contact: Ben Dudson, dudson2@llnl.gov
  *
@@ -116,14 +116,15 @@ private:
   Vec snes_x;   ///< Result of SNES
   Vec x0;       ///< Solution at start of current timestep
   Vec delta_x;  ///< Change in solution
+  Vec output_x; ///< Solution to output. Used if interpolating.
 
   bool predictor;       ///< Use linear predictor?
   Vec x1;               ///< Previous solution
   BoutReal time1{-1.0}; ///< Time of previous solution
 
-  SNES snes;                ///< SNES context
-  Mat Jmf;                  ///< Matrix Free Jacobian
-  Mat Jfd;                  ///< Finite Difference Jacobian
+  SNES snes;                         ///< SNES context
+  Mat Jmf;                           ///< Matrix Free Jacobian
+  Mat Jfd;                           ///< Finite Difference Jacobian
   MatFDColoring fdcoloring{nullptr}; ///< Matrix coloring context
                                      ///< Jacobian evaluation
 
@@ -135,10 +136,10 @@ private:
   std::string pc_hypre_type;      ///< Hypre preconditioner type
   std::string line_search_type;   ///< Line search type
 
-  bool matrix_free;               ///< Use matrix free Jacobian
-  bool matrix_free_operator;      ///< Use matrix free Jacobian in the operator?
-  int lag_jacobian;               ///< Re-use Jacobian
-  bool use_coloring;              ///< Use matrix coloring
+  bool matrix_free;          ///< Use matrix free Jacobian
+  bool matrix_free_operator; ///< Use matrix free Jacobian in the operator?
+  int lag_jacobian;          ///< Re-use Jacobian
+  bool use_coloring;         ///< Use matrix coloring
 
   bool jacobian_recalculated; ///< Flag set when Jacobian is recalculated
   bool prune_jacobian;        ///< Remove small elements in the Jacobian?

From 8159339f67e2d3f8032ac5ae146e088841879bdf Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Sat, 3 May 2025 11:26:30 -0700
Subject: [PATCH 049/129] snes: Make timestep adjustment tunable

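Add tunable inputs for the factor that multiplies the timestep when
a solve fails to converge (timestep_factor_on_failure), and when the
number of nonlinear iterations is too high (timestep_factor_on_upper_its)
or too low (timestep_factor_on_lower_its).

Note that the default factor for increasing the timestep changes from
1.1 to 1.4, and the timestep is no longer increased in the first steps
after a convergence failure.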
---
 src/solver/impls/snes/snes.cxx | 33 ++++++++++++++++++++++++---------
 src/solver/impls/snes/snes.hxx |  4 ++++
 2 files changed, 28 insertions(+), 9 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 0e514d56cc..780019e5b3 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -123,6 +123,15 @@ SNESSolver::SNESSolver(Options* opts)
       upper_its((*options)["upper_its"]
                     .doc("Iterations above which the next timestep is reduced")
                     .withDefault(static_cast<int>(maxits * 0.8))),
+      timestep_factor_on_failure((*options)["timestep_factor_on_failure"]
+                                 .doc("Multiply timestep on convergence failure")
+                                 .withDefault(0.5)),
+      timestep_factor_on_upper_its((*options)["timestep_factor_on_upper_its"]
+                                   .doc("Multiply timestep if iterations exceed upper_its")
+                                   .withDefault(0.9)),
+      timestep_factor_on_lower_its((*options)["timestep_factor_on_lower_its"]
+                                   .doc("Multiply timestep if iterations are below lower_its")
+                                   .withDefault(1.4)),
       diagnose(
           (*options)["diagnose"].doc("Print additional diagnostics").withDefault(false)),
       diagnose_failures((*options)["diagnose_failures"]
@@ -731,6 +740,7 @@ int SNESSolver::run() {
 
     bool looping = true;
     int snes_failures = 0; // Count SNES convergence failures
+    int steps_since_snes_failure = 0;
     int saved_jacobian_lag = 0;
     int loop_count = 0;
     do {
@@ -868,9 +878,10 @@ int SNESSolver::run() {
         }
 
         ++snes_failures;
+        steps_since_snes_failure = 0;
 
         // Try a smaller timestep
-        timestep /= 2.0;
+        timestep *= timestep_factor_on_failure;
         // Restore state
         VecCopy(x0, snes_x);
 
@@ -961,6 +972,7 @@ int SNESSolver::run() {
       }
 
       simtime += dt;
+      ++steps_since_snes_failure;
 
       if (diagnose) {
         // Gather and print diagnostic information
@@ -970,7 +982,6 @@ int SNESSolver::run() {
                      simtime, timestep, nl_its, lin_its, static_cast<int>(reason));
         if (snes_failures > 0) {
           output.write(", SNES failures: {}", snes_failures);
-          snes_failures = 0;
         }
         output.write("\n");
       }
@@ -1025,9 +1036,10 @@ int SNESSolver::run() {
         // Note: The preconditioner depends on the timestep,
         // so if it is not recalculated the it will be less
         // effective.
-        if ((nl_its <= lower_its) && (timestep < max_timestep)) {
+        if ((nl_its <= lower_its) && (timestep < max_timestep)
+            && (steps_since_snes_failure > 2)) {
           // Increase timestep slightly
-          timestep *= 1.1;
+          timestep *= timestep_factor_on_lower_its;
 
           if (timestep > max_timestep) {
             timestep = max_timestep;
@@ -1041,15 +1053,17 @@ int SNESSolver::run() {
           // Depends on equation_form
           // -> Probably call SNESSetJacobian(snes, Jfd, Jfd, NULL, fdcoloring);
 
-          // Recompute Jacobian (for now)
-          if (saved_jacobian_lag == 0) {
-            SNESGetLagJacobian(snes, &saved_jacobian_lag);
-            SNESSetLagJacobian(snes, 1);
+          if (static_cast<BoutReal>(lin_its) / nl_its > 4) {
+            // Recompute Jacobian (for now)
+            if (saved_jacobian_lag == 0) {
+              SNESGetLagJacobian(snes, &saved_jacobian_lag);
+              SNESSetLagJacobian(snes, 1);
+            }
           }
 
         } else if (nl_its >= upper_its) {
           // Reduce timestep slightly
-          timestep *= 0.9;
+          timestep *= timestep_factor_on_upper_its;
 
           // Recompute Jacobian
           if (saved_jacobian_lag == 0) {
@@ -1058,6 +1072,7 @@ int SNESSolver::run() {
           }
         }
       }
+      snes_failures = 0;
     } while (looping);
 
     if (!matrix_free) {
diff --git a/src/solver/impls/snes/snes.hxx b/src/solver/impls/snes/snes.hxx
index 187a64fb40..cba2352582 100644
--- a/src/solver/impls/snes/snes.hxx
+++ b/src/solver/impls/snes/snes.hxx
@@ -102,6 +102,10 @@ private:
   int maxits;               ///< Maximum nonlinear iterations
   int lower_its, upper_its; ///< Limits on iterations for timestep adjustment
 
+  BoutReal timestep_factor_on_failure;
+  BoutReal timestep_factor_on_upper_its;
+  BoutReal timestep_factor_on_lower_its;
+
   bool diagnose;          ///< Output additional diagnostics
   bool diagnose_failures; ///< Print diagnostics on SNES failures
 

From 1d7ab067d57773111206d7895e6ee12d614d1ded Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Fri, 9 May 2025 16:46:51 -0700
Subject: [PATCH 050/129] periodicX communication fixes

- Fix Mesh::(send/irecv)X(In/Out) so that they work with periodicX=true

- FV::communicateFluxes now communicates when periodicX=true
---
 src/mesh/fv_ops.cxx              |  5 ++-
 src/mesh/impls/bout/boutmesh.cxx | 64 ++++++++++++++++++++++++--------
 2 files changed, 51 insertions(+), 18 deletions(-)

diff --git a/src/mesh/fv_ops.cxx b/src/mesh/fv_ops.cxx
index cd5b924e9e..fe5422b4d1 100644
--- a/src/mesh/fv_ops.cxx
+++ b/src/mesh/fv_ops.cxx
@@ -442,8 +442,9 @@ void communicateFluxes(Field3D& f) {
   comm_handle xin, xout;
   // Cache results to silence spurious compiler warning about xin,
   // xout possibly being uninitialised when used
-  bool not_first = !mesh->firstX();
-  bool not_last = !mesh->lastX();
+  const bool not_first = mesh->periodicX || !mesh->firstX();
+  const bool not_last = mesh->periodicX || !mesh->lastX();
+
   if (not_first) {
     xin = mesh->irecvXIn(f(0, 0), size, 0);
   }
diff --git a/src/mesh/impls/bout/boutmesh.cxx b/src/mesh/impls/bout/boutmesh.cxx
index 16061cd47e..31e9c6112d 100644
--- a/src/mesh/impls/bout/boutmesh.cxx
+++ b/src/mesh/impls/bout/boutmesh.cxx
@@ -1534,42 +1534,66 @@ bool BoutMesh::firstX() const { return PE_XIND == 0; }
 bool BoutMesh::lastX() const { return PE_XIND == NXPE - 1; }
 
 int BoutMesh::sendXOut(BoutReal* buffer, int size, int tag) {
+  Timer timer("comms");
+
+  int proc {-1};
   if (PE_XIND == NXPE - 1) {
-    return 1;
+    if (periodicX) {
+      // Wrap around to first processor in X
+      proc = PROC_NUM(0, PE_YIND);
+    } else {
+      return 1;
+    }
+  } else {
+    proc = PROC_NUM(PE_XIND + 1, PE_YIND);
   }
 
-  Timer timer("comms");
-
-  mpi->MPI_Send(buffer, size, PVEC_REAL_MPI_TYPE, PROC_NUM(PE_XIND + 1, PE_YIND), tag,
+  mpi->MPI_Send(buffer, size, PVEC_REAL_MPI_TYPE, proc, tag,
                 BoutComm::get());
 
   return 0;
 }
 
 int BoutMesh::sendXIn(BoutReal* buffer, int size, int tag) {
+  Timer timer("comms");
+
+  int proc {-1};
   if (PE_XIND == 0) {
-    return 1;
+    if (periodicX) {
+      // Wrap around to last processor in X
+      proc = PROC_NUM(NXPE - 1, PE_YIND);
+    } else {
+      return 1;
+    }
+  } else {
+    proc = PROC_NUM(PE_XIND - 1, PE_YIND);
   }
 
-  Timer timer("comms");
-
-  mpi->MPI_Send(buffer, size, PVEC_REAL_MPI_TYPE, PROC_NUM(PE_XIND - 1, PE_YIND), tag,
+  mpi->MPI_Send(buffer, size, PVEC_REAL_MPI_TYPE, proc, tag,
                 BoutComm::get());
 
   return 0;
 }
 
 comm_handle BoutMesh::irecvXOut(BoutReal* buffer, int size, int tag) {
+  Timer timer("comms");
+
+  int proc {-1};
   if (PE_XIND == NXPE - 1) {
-    return nullptr;
+    if (periodicX) {
+      // Wrap around to first processor in X
+      proc = PROC_NUM(0, PE_YIND);
+    } else {
+      return nullptr;
+    }
+  } else {
+    proc = PROC_NUM(PE_XIND + 1, PE_YIND);
   }
 
-  Timer timer("comms");
-
   // Get a communications handle. Not fussy about size of arrays
   CommHandle* ch = get_handle(0, 0);
 
-  mpi->MPI_Irecv(buffer, size, PVEC_REAL_MPI_TYPE, PROC_NUM(PE_XIND + 1, PE_YIND), tag,
+  mpi->MPI_Irecv(buffer, size, PVEC_REAL_MPI_TYPE, proc, tag,
                  BoutComm::get(), ch->request);
 
   ch->in_progress = true;
@@ -1578,16 +1602,24 @@ comm_handle BoutMesh::irecvXOut(BoutReal* buffer, int size, int tag) {
 }
 
 comm_handle BoutMesh::irecvXIn(BoutReal* buffer, int size, int tag) {
+  Timer timer("comms");
+
+  int proc {-1};
   if (PE_XIND == 0) {
-    return nullptr;
+    if (periodicX) {
+      // Wrap around to last processor in X
+      proc = PROC_NUM(NXPE - 1, PE_YIND);
+    } else {
+      return nullptr;
+    }
+  } else {
+    proc = PROC_NUM(PE_XIND - 1, PE_YIND);
   }
 
-  Timer timer("comms");
-
   // Get a communications handle. Not fussy about size of arrays
   CommHandle* ch = get_handle(0, 0);
 
-  mpi->MPI_Irecv(buffer, size, PVEC_REAL_MPI_TYPE, PROC_NUM(PE_XIND - 1, PE_YIND), tag,
+  mpi->MPI_Irecv(buffer, size, PVEC_REAL_MPI_TYPE, proc, tag,
                  BoutComm::get(), ch->request);
 
   ch->in_progress = true;

From 49ae23b3ebd76e30f972855314764d3b860386e1 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Mon, 28 Apr 2025 17:56:38 +0100
Subject: [PATCH 051/129] Modify generation of test values for Rxy

---
 tests/unit/mesh/test_change_coordinate_system.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index f6075e5485..f1498a4982 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -20,7 +20,7 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
     for (int i = 0; i < tokamak_options.Rxy.getNx(); i++) {
         for (int j = 0; j < tokamak_options.Rxy.getNy(); j++) {
-            tokamak_options.Rxy(i, j) = ((float) i + 1) / 1000 * ((float) j + 1) / 1000;
+            tokamak_options.Rxy(i, j) = sqrt(SQ(i) + SQ(j));
         }
     }
 

From 5387b8a1e2f64cbcfb353706daf3e988b893491e Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 14 May 2025 16:13:51 +0100
Subject: [PATCH 052/129] Use a realistic set of test points as input

---
 tests/unit/mesh/test_change_coordinate_system.cxx | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index f1498a4982..5edab230cf 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -2,6 +2,7 @@
 #include "bout/coordinates.hxx"
 #include "bout/mesh.hxx"
 #include "fake_mesh_fixture.hxx"
+#include "bout/constants.hxx"
 #include <bout/tokamak_coordinates.hxx>
 
 
@@ -16,11 +17,16 @@ class CoordinateTransformTest : public FakeMeshFixture {
 
 TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
+    double R0 = 2.0;  // major radius
+    double r[9] = {0.10, 0.15, 0.20, 0.25, 0.30};  // minor radius
+    double theta[3] = {1.07712, 3.17151, 5.26591};  // poloidal angle
+
     auto tokamak_options = bout::TokamakOptions(*mesh);
 
     for (int i = 0; i < tokamak_options.Rxy.getNx(); i++) {
-        for (int j = 0; j < tokamak_options.Rxy.getNy(); j++) {
-            tokamak_options.Rxy(i, j) = sqrt(SQ(i) + SQ(j));
+        for (int j = 0; j < tokamak_options.Zxy.getNy(); j++) {
+            tokamak_options.Rxy(i, j) = R0 + r[i] * cos(theta[j]);
+            tokamak_options.Zxy(i, j) = r[i] * sin(theta[j]);
         }
     }
 

From c1ed640c4eeb663be1d9083d645ca8f633b2b680 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 21 May 2025 14:01:56 +0100
Subject: [PATCH 053/129] Use standard library functions for sin() and cos()

---
 src/mesh/tokamak_coordinates.cxx                  | 4 ++--
 tests/unit/mesh/test_change_coordinate_system.cxx | 8 ++++----
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/mesh/tokamak_coordinates.cxx b/src/mesh/tokamak_coordinates.cxx
index 8161acb34a..5f22b415e3 100644
--- a/src/mesh/tokamak_coordinates.cxx
+++ b/src/mesh/tokamak_coordinates.cxx
@@ -38,8 +38,8 @@ namespace bout {
         for (int i = 0; i < toroidal_angle.getNx(); i++) {
             for (int j = 0; j < toroidal_angle.getNy(); j++) {
                 for (int k = 0; k < toroidal_angle.getNz(); k++) {
-                    x(i, j, k) = Rxy(i, j) * cos(toroidal_angle(i, j, k));
-                    y(i, j, k) = Rxy(i, j) * sin(toroidal_angle(i, j, k));
+                    x(i, j, k) = Rxy(i, j) * std::cos(toroidal_angle(i, j, k));
+                    y(i, j, k) = Rxy(i, j) * std::sin(toroidal_angle(i, j, k));
                     z(i, j, k) = Zxy(i, j);
                 }
             }
diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index 5edab230cf..8651c17478 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -25,8 +25,8 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
     for (int i = 0; i < tokamak_options.Rxy.getNx(); i++) {
         for (int j = 0; j < tokamak_options.Zxy.getNy(); j++) {
-            tokamak_options.Rxy(i, j) = R0 + r[i] * cos(theta[j]);
-            tokamak_options.Zxy(i, j) = r[i] * sin(theta[j]);
+            tokamak_options.Rxy(i, j) = R0 + r[i] * std::cos(theta[j]);
+            tokamak_options.Zxy(i, j) = r[i] * std::sin(theta[j]);
         }
     }
 
@@ -40,8 +40,8 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
                 auto actual_y = cartesian_coords.y(jx, jy, jz);
                 auto actual_z = cartesian_coords.z(jx, jy, jz);
 
-                auto expected_x = tokamak_options.Rxy(jx, jy) * cos(tokamak_options.toroidal_angle(jx, jy, jz));
-                auto expected_y = tokamak_options.Rxy(jx, jy) * sin(tokamak_options.toroidal_angle(jx, jy, jz));
+                auto expected_x = tokamak_options.Rxy(jx, jy) * std::cos(tokamak_options.toroidal_angle(jx, jy, jz));
+                auto expected_y = tokamak_options.Rxy(jx, jy) * std::sin(tokamak_options.toroidal_angle(jx, jy, jz));
                 auto expected_z = tokamak_options.Zxy(jx, jy);
 
                 EXPECT_EQ(actual_x, expected_x);

From e6e1d6215401fc69012e01502e5c03f94fd8cd79 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Fri, 16 May 2025 10:03:05 +0100
Subject: [PATCH 054/129] Use a vector for the toroidal angle values. Iterate
 over all r, theta values

---
 include/bout/tokamak_coordinates.hxx          |  2 +-
 src/mesh/tokamak_coordinates.cxx              | 19 ++++++++++++-------
 .../mesh/test_change_coordinate_system.cxx    | 16 ++++++++--------
 3 files changed, 21 insertions(+), 16 deletions(-)

diff --git a/include/bout/tokamak_coordinates.hxx b/include/bout/tokamak_coordinates.hxx
index f75825ad3a..7075cf8ccf 100644
--- a/include/bout/tokamak_coordinates.hxx
+++ b/include/bout/tokamak_coordinates.hxx
@@ -29,7 +29,7 @@ namespace bout {
         Field2D hthe;
         FieldMetric I;
         FieldMetric dx;
-        FieldMetric toroidal_angle;
+        std::vector<double> toroidal_angles;
 
         TokamakOptions(Mesh &mesh);
 
diff --git a/src/mesh/tokamak_coordinates.cxx b/src/mesh/tokamak_coordinates.cxx
index 5f22b415e3..e6272035df 100644
--- a/src/mesh/tokamak_coordinates.cxx
+++ b/src/mesh/tokamak_coordinates.cxx
@@ -28,18 +28,23 @@ namespace bout {
             dx = mesh.getCoordinates()->dx();
         }
 //        mesh.get(toroidal_angle, "z");
-        toroidal_angle = 2 * PI / Rxy.size();
+        const auto d_phi = TWOPI / mesh.LocalNz;
+        auto current_phi = 0.0;
+        for (int k = 0; k < mesh.LocalNz; k++) {
+            toroidal_angles.push_back(current_phi);
+            current_phi += d_phi;
+        }
     }
 
     Coordinates3D TokamakOptions::CylindricalCoordinatesToCartesian() {
         Field3D x = emptyFrom(Rxy);
         Field3D y = emptyFrom(Rxy);
         Field3D z = emptyFrom(Zxy);
-        for (int i = 0; i < toroidal_angle.getNx(); i++) {
-            for (int j = 0; j < toroidal_angle.getNy(); j++) {
-                for (int k = 0; k < toroidal_angle.getNz(); k++) {
-                    x(i, j, k) = Rxy(i, j) * std::cos(toroidal_angle(i, j, k));
-                    y(i, j, k) = Rxy(i, j) * std::sin(toroidal_angle(i, j, k));
+        for (int i = 0; i < Rxy.getNx(); i++) {
+            for (int j = 0; j < Rxy.getNy(); j++) {
+                for (uint k = 0; k < toroidal_angles.size(); k++) {
+                    x(i, j, k) = Rxy(i, j) * cos(toroidal_angles[k]);
+                    y(i, j, k) = Rxy(i, j) * sin(toroidal_angles[k]);
                     z(i, j, k) = Zxy(i, j);
                 }
             }
@@ -66,7 +71,7 @@ namespace bout {
 
         const BoutReal sign_of_bp = get_sign_of_bp(tokamak_options.Bpxy);
 
-        auto *coord = mesh.getCoordinates();
+        auto* coord = mesh.getCoordinates();
 
         const auto g11 = SQ(tokamak_options.Rxy * tokamak_options.Bpxy);
         const auto g22 = 1.0 / SQ(tokamak_options.hthe);
diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index 8651c17478..2fedadb3c2 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -18,15 +18,15 @@ class CoordinateTransformTest : public FakeMeshFixture {
 TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
     double R0 = 2.0;  // major radius
-    double r[9] = {0.10, 0.15, 0.20, 0.25, 0.30};  // minor radius
-    double theta[3] = {1.07712, 3.17151, 5.26591};  // poloidal angle
+    std::array<double, 5> r = {0.10, 0.15, 0.20, 0.25, 0.30};  // minor radius
+    std::array<double, 4> theta = {0.0, 1.07712, 3.17151, 5.26591};  // poloidal angle
 
     auto tokamak_options = bout::TokamakOptions(*mesh);
 
-    for (int i = 0; i < tokamak_options.Rxy.getNx(); i++) {
-        for (int j = 0; j < tokamak_options.Zxy.getNy(); j++) {
-            tokamak_options.Rxy(i, j) = R0 + r[i] * std::cos(theta[j]);
-            tokamak_options.Zxy(i, j) = r[i] * std::sin(theta[j]);
+    for (int i = 0; i < r.size(); i++) {
+        for (int j = 0; j < theta.size(); j++) {
+            tokamak_options.Rxy(i, j) = R0 + r[i] * cos(theta[j]);
+            tokamak_options.Zxy(i, j) = r[i] * sin(theta[j]);
         }
     }
 
@@ -40,8 +40,8 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
                 auto actual_y = cartesian_coords.y(jx, jy, jz);
                 auto actual_z = cartesian_coords.z(jx, jy, jz);
 
-                auto expected_x = tokamak_options.Rxy(jx, jy) * std::cos(tokamak_options.toroidal_angle(jx, jy, jz));
-                auto expected_y = tokamak_options.Rxy(jx, jy) * std::sin(tokamak_options.toroidal_angle(jx, jy, jz));
+                auto expected_x = tokamak_options.Rxy(jx, jy) * std::cos(tokamak_options.toroidal_angles[jz]);
+                auto expected_y = tokamak_options.Rxy(jx, jy) * std::sin(tokamak_options.toroidal_angles[jz]);
                 auto expected_z = tokamak_options.Zxy(jx, jy);
 
                 EXPECT_EQ(actual_x, expected_x);

From bd86979c3199f16a347c22d08fb7358628759abb Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 21 May 2025 13:53:59 +0100
Subject: [PATCH 055/129] Prefer const

---
 tests/unit/mesh/test_change_coordinate_system.cxx | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index 2fedadb3c2..6b84fcac34 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -17,9 +17,9 @@ class CoordinateTransformTest : public FakeMeshFixture {
 
 TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
-    double R0 = 2.0;  // major radius
-    std::array<double, 5> r = {0.10, 0.15, 0.20, 0.25, 0.30};  // minor radius
-    std::array<double, 4> theta = {0.0, 1.07712, 3.17151, 5.26591};  // poloidal angle
+    const double R0 = 2.0;  // major radius
+    const std::array<double, 5> r = {0.10, 0.15, 0.20, 0.25, 0.30};  // minor radius
+    const std::array<double, 4> theta = {0.0, 1.07712, 3.17151, 5.26591};  // poloidal angle
 
     auto tokamak_options = bout::TokamakOptions(*mesh);
 

From 392ae19537e3ee1f371c4f49f668892109b14420 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 21 May 2025 13:57:47 +0100
Subject: [PATCH 056/129] Use range-based loops

---
 src/mesh/tokamak_coordinates.cxx                 |  8 +++++---
 .../unit/mesh/test_change_coordinate_system.cxx  | 16 ++++++++++------
 2 files changed, 15 insertions(+), 9 deletions(-)

diff --git a/src/mesh/tokamak_coordinates.cxx b/src/mesh/tokamak_coordinates.cxx
index e6272035df..a8ceab74f1 100644
--- a/src/mesh/tokamak_coordinates.cxx
+++ b/src/mesh/tokamak_coordinates.cxx
@@ -42,10 +42,12 @@ namespace bout {
         Field3D z = emptyFrom(Zxy);
         for (int i = 0; i < Rxy.getNx(); i++) {
             for (int j = 0; j < Rxy.getNy(); j++) {
-                for (uint k = 0; k < toroidal_angles.size(); k++) {
-                    x(i, j, k) = Rxy(i, j) * cos(toroidal_angles[k]);
-                    y(i, j, k) = Rxy(i, j) * sin(toroidal_angles[k]);
+                int k = 0;
+                for (int angle : toroidal_angles) {
+                    x(i, j, k) = Rxy(i, j) * std::cos(angle);
+                    y(i, j, k) = Rxy(i, j) * std::sin(angle);
                     z(i, j, k) = Zxy(i, j);
+                    k++;
                 }
             }
         }
diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index 6b84fcac34..cf954bd51f 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -18,16 +18,20 @@ class CoordinateTransformTest : public FakeMeshFixture {
 TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
     const double R0 = 2.0;  // major radius
-    const std::array<double, 5> r = {0.10, 0.15, 0.20, 0.25, 0.30};  // minor radius
-    const std::array<double, 4> theta = {0.0, 1.07712, 3.17151, 5.26591};  // poloidal angle
+    const std::array<double, 5> r_values = {0.10, 0.15, 0.20, 0.25, 0.30};  // minor radius
+    const std::array<double, 4> theta_values = {0.0, 1.07712, 3.17151, 5.26591};  // poloidal angle
 
     auto tokamak_options = bout::TokamakOptions(*mesh);
 
-    for (int i = 0; i < r.size(); i++) {
-        for (int j = 0; j < theta.size(); j++) {
-            tokamak_options.Rxy(i, j) = R0 + r[i] * cos(theta[j]);
-            tokamak_options.Zxy(i, j) = r[i] * sin(theta[j]);
+    int i = 0;
+    for (auto r: r_values) {
+        int j = 0;
+        for (auto theta: theta_values) {
+            tokamak_options.Rxy(i, j) = R0 + r * std::cos(theta);
+            tokamak_options.Zxy(i, j) = r * std::sin(theta);
+            j++;
         }
+        i++;
     }
 
     bout::Coordinates3D cartesian_coords = tokamak_options.CylindricalCoordinatesToCartesian();

From 25c850e7cd77b2a364e16854cd57b0f8edbac7b4 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 21 May 2025 13:55:20 +0100
Subject: [PATCH 057/129] Pass parameters by reference

---
 include/bout/tokamak_coordinates.hxx | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/include/bout/tokamak_coordinates.hxx b/include/bout/tokamak_coordinates.hxx
index 7075cf8ccf..dd1629799c 100644
--- a/include/bout/tokamak_coordinates.hxx
+++ b/include/bout/tokamak_coordinates.hxx
@@ -17,7 +17,7 @@ namespace bout {
         Field3D y;
         Field3D z;
 
-        Coordinates3D(Field3D x, Field3D y, Field3D z) : x(x), y(y), z(z) {}
+        Coordinates3D(Field3D& x, Field3D& y, Field3D& z) : x(x), y(y), z(z) {}
     };
 
     struct TokamakOptions {
@@ -31,7 +31,7 @@ namespace bout {
         FieldMetric dx;
         std::vector<double> toroidal_angles;
 
-        TokamakOptions(Mesh &mesh);
+        TokamakOptions(Mesh& mesh);
 
         void normalise(BoutReal Lbar, BoutReal Bbar, BoutReal ShearFactor);
 

From bf20998417128b33698f6d4cedfcc757a132630e Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 21 May 2025 20:39:42 +0100
Subject: [PATCH 058/129] FakeMeshFixture has nx=3, ny=5, nz=7

---
 tests/unit/mesh/test_change_coordinate_system.cxx | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index cf954bd51f..f84c6db6f0 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -18,8 +18,8 @@ class CoordinateTransformTest : public FakeMeshFixture {
 TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
     const double R0 = 2.0;  // major radius
-    const std::array<double, 5> r_values = {0.10, 0.15, 0.20, 0.25, 0.30};  // minor radius
-    const std::array<double, 4> theta_values = {0.0, 1.07712, 3.17151, 5.26591};  // poloidal angle
+    const std::array<double, 3> r_values = {0.1, 0.2, 0.3};  // minor radius
+    const std::array<double, 5> theta_values = {0.0, 1.25663, 2.51327, 3.76991, 5.02654};  // poloidal angle
 
     auto tokamak_options = bout::TokamakOptions(*mesh);
 

From 7296f4b72e5693476fd9a06b5e30d5adfe574303 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 21 May 2025 21:10:15 +0100
Subject: [PATCH 059/129] Use nx and ny variables, to avoid magic numbers

---
 tests/unit/mesh/test_change_coordinate_system.cxx | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index f84c6db6f0..4215ff04eb 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -18,8 +18,8 @@ class CoordinateTransformTest : public FakeMeshFixture {
 TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
     const double R0 = 2.0;  // major radius
-    const std::array<double, 3> r_values = {0.1, 0.2, 0.3};  // minor radius
-    const std::array<double, 5> theta_values = {0.0, 1.25663, 2.51327, 3.76991, 5.02654};  // poloidal angle
+    const std::array<double, nx> r_values = {0.1, 0.2, 0.3};  // minor radius
+    const std::array<double, ny> theta_values = {0.0, 1.25663, 2.51327, 3.76991, 5.02654};  // poloidal angle
 
     auto tokamak_options = bout::TokamakOptions(*mesh);
 

From 19d64545f22812fa78dbe7461bffe0c39ffa4ce2 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 21 May 2025 21:36:11 +0100
Subject: [PATCH 060/129] Bug fix: toroidal angle is not an int

---
 src/mesh/tokamak_coordinates.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/mesh/tokamak_coordinates.cxx b/src/mesh/tokamak_coordinates.cxx
index a8ceab74f1..cc81358833 100644
--- a/src/mesh/tokamak_coordinates.cxx
+++ b/src/mesh/tokamak_coordinates.cxx
@@ -43,7 +43,7 @@ namespace bout {
         for (int i = 0; i < Rxy.getNx(); i++) {
             for (int j = 0; j < Rxy.getNy(); j++) {
                 int k = 0;
-                for (int angle : toroidal_angles) {
+                for (auto angle : toroidal_angles) {
                     x(i, j, k) = Rxy(i, j) * std::cos(angle);
                     y(i, j, k) = Rxy(i, j) * std::sin(angle);
                     z(i, j, k) = Zxy(i, j);

From f5d3abe8572f82ebc5aee025b2bd66d618c0776f Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Wed, 21 May 2025 20:43:49 -0700
Subject: [PATCH 061/129] cvode: Add linear_solver option

Selects the linear solver to be used by CVODE. Usually the default
GMRES works well, but FGMRES can work better.

Example:

```
[solver]
linear_solver = fgmres
```
---
 manual/sphinx/user_docs/time_integration.rst |  3 +++
 src/solver/impls/cvode/cvode.cxx             | 25 +++++++++++++++++++-
 2 files changed, 27 insertions(+), 1 deletion(-)

diff --git a/manual/sphinx/user_docs/time_integration.rst b/manual/sphinx/user_docs/time_integration.rst
index a4db823369..c1526c14e2 100644
--- a/manual/sphinx/user_docs/time_integration.rst
+++ b/manual/sphinx/user_docs/time_integration.rst
@@ -165,6 +165,9 @@ nonlinear solvers:
   `CVodeSetEpsLin
   <https://sundials.readthedocs.io/en/latest/cvodes/Usage/SIM.html#c.CVodeSetEpsLin>`_.
 
+The linear solver type can be set using the ``linear_solver`` option.
+Valid choices are ``gmres`` (the default), ``fgmres``, ``tfqmr`` and ``bcgs``.
+
 IMEX-BDF2
 ---------
 
diff --git a/src/solver/impls/cvode/cvode.cxx b/src/solver/impls/cvode/cvode.cxx
index f0d42d39bc..8b81a66f6d 100644
--- a/src/solver/impls/cvode/cvode.cxx
+++ b/src/solver/impls/cvode/cvode.cxx
@@ -51,6 +51,10 @@
 #include <cvode/cvode_bbdpre.h>
 #include <cvode/cvode_ls.h>
 
+#include <sunlinsol/sunlinsol_spbcgs.h>
+#include <sunlinsol/sunlinsol_spfgmr.h>
+#include <sunlinsol/sunlinsol_sptfqmr.h>
+
 #include <algorithm>
 #include <iterator>
 #include <numeric>
@@ -59,6 +63,8 @@
 BOUT_ENUM_CLASS(positivity_constraint, none, positive, non_negative, negative,
                 non_positive);
 
+BOUT_ENUM_CLASS(linear_solver, gmres, fgmres, tfqmr, bcgs);
+
 // NOLINTBEGIN(readability-identifier-length)
 namespace {
 int cvode_linear_rhs(BoutReal t, N_Vector u, N_Vector du, void* user_data);
@@ -344,7 +350,24 @@ int CvodeSolver::init() {
 
     const auto prectype =
         use_precon ? (rightprec ? SUN_PREC_RIGHT : SUN_PREC_LEFT) : SUN_PREC_NONE;
-    sun_solver = callWithSUNContext(SUNLinSol_SPGMR, suncontext, uvec, prectype, maxl);
+
+    switch ((*options)["linear_solver"]
+                .doc("Set linear solver type. Default is gmres.")
+                .withDefault(linear_solver::gmres)) {
+    case linear_solver::gmres:
+      sun_solver = callWithSUNContext(SUNLinSol_SPGMR, suncontext, uvec, prectype, maxl);
+      break;
+    case linear_solver::fgmres:
+      sun_solver = callWithSUNContext(SUNLinSol_SPFGMR, suncontext, uvec, prectype, maxl);
+      break;
+    case linear_solver::tfqmr:
+      sun_solver =
+          callWithSUNContext(SUNLinSol_SPTFQMR, suncontext, uvec, prectype, maxl);
+      break;
+    case linear_solver::bcgs:
+      sun_solver = callWithSUNContext(SUNLinSol_SPBCGS, suncontext, uvec, prectype, maxl);
+      break;
+    };
     if (sun_solver == nullptr) {
       throw BoutException("Creating SUNDIALS linear solver failed\n");
     }

From b9757cd3e271139bb1bd49b12595435b4c1b7020 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Thu, 22 May 2025 10:23:25 +0100
Subject: [PATCH 062/129] Add explanatory comments to test

---
 tests/unit/mesh/test_change_coordinate_system.cxx | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index 4215ff04eb..342b4a3115 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -17,6 +17,12 @@ class CoordinateTransformTest : public FakeMeshFixture {
 
 TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
+    // arrange
+
+    // Set up test values
+    // Calculate cylindrical coordinates (Rxy, Zxy)
+    // from (2D) orthogonal poloidal coordinates (r, theta)
+
     const double R0 = 2.0;  // major radius
     const std::array<double, nx> r_values = {0.1, 0.2, 0.3};  // minor radius
     const std::array<double, ny> theta_values = {0.0, 1.25663, 2.51327, 3.76991, 5.02654};  // poloidal angle
@@ -34,8 +40,10 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
         i++;
     }
 
+    // act
     bout::Coordinates3D cartesian_coords = tokamak_options.CylindricalCoordinatesToCartesian();
 
+    // assert
     for (int jx = 0; jx < mesh->xend; jx++) {
         for (int jy = 0; jy < mesh->yend; jy++) {
             for (int jz = 0; jz < mesh->LocalNz; jz++) {

From 0fb5b3f5ede5d5b48a96469ca0ea88de16fe767c Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Thu, 22 May 2025 13:08:51 +0100
Subject: [PATCH 063/129] Don't instantiate Field3D from Field2D

---
 src/mesh/tokamak_coordinates.cxx | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/src/mesh/tokamak_coordinates.cxx b/src/mesh/tokamak_coordinates.cxx
index cc81358833..740d19e325 100644
--- a/src/mesh/tokamak_coordinates.cxx
+++ b/src/mesh/tokamak_coordinates.cxx
@@ -37,9 +37,12 @@ namespace bout {
     }
 
     Coordinates3D TokamakOptions::CylindricalCoordinatesToCartesian() {
-        Field3D x = emptyFrom(Rxy);
-        Field3D y = emptyFrom(Rxy);
-        Field3D z = emptyFrom(Zxy);
+
+        auto* mesh = Rxy.getMesh();
+        Field3D x = Field3D(0.0, mesh);
+        Field3D y = Field3D(0.0, mesh);
+        Field3D z = Field3D(0.0, mesh);
+
         for (int i = 0; i < Rxy.getNx(); i++) {
             for (int j = 0; j < Rxy.getNy(); j++) {
                 int k = 0;

From 02d4cbfe246ed9002ce44d24007e7edf28be54d1 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Thu, 22 May 2025 13:09:29 +0100
Subject: [PATCH 064/129] Just test min and max values

---
 .../mesh/test_change_coordinate_system.cxx    | 43 ++++++++++++-------
 1 file changed, 27 insertions(+), 16 deletions(-)

diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index 342b4a3115..3777beb3f1 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -25,7 +25,12 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
 
     const double R0 = 2.0;  // major radius
     const std::array<double, nx> r_values = {0.1, 0.2, 0.3};  // minor radius
-    const std::array<double, ny> theta_values = {0.0, 1.25663, 2.51327, 3.76991, 5.02654};  // poloidal angle
+    const std::array<double, ny> theta_values = {  // poloidal angle
+            0.0,
+            PI / 2,
+            PI,
+            3 * PI / 2,
+            2 * PI};
 
     auto tokamak_options = bout::TokamakOptions(*mesh);
 
@@ -44,22 +49,28 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
     bout::Coordinates3D cartesian_coords = tokamak_options.CylindricalCoordinatesToCartesian();
 
     // assert
-    for (int jx = 0; jx < mesh->xend; jx++) {
-        for (int jy = 0; jy < mesh->yend; jy++) {
-            for (int jz = 0; jz < mesh->LocalNz; jz++) {
+    const auto max_r = *std::max_element(begin(r_values), end(r_values));
+    const auto expected_max_x = R0 + max_r;
+    // With nz=7, there is no toroidal coordinate point at exactly pi/2; the nearest point is at 2/7 * 2pi
+    const auto expected_max_y = (R0 + max_r) * std::sin(TWOPI * 2 / 7);
+    const auto expected_max_z = max_r;
 
-                auto actual_x = cartesian_coords.x(jx, jy, jz);
-                auto actual_y = cartesian_coords.y(jx, jy, jz);
-                auto actual_z = cartesian_coords.z(jx, jy, jz);
+    // With nz=7, there is no toroidal coordinate point at exactly pi; the nearest point is at 3/7 * 2pi
+    const auto expected_min_x = -1 * (R0 + max_r) * std::cos(TWOPI / 7 / 2);
+    const auto expected_min_y = -1 * (R0 + max_r) * std::sin(TWOPI * 2 / 7);
+    const auto expected_min_z = -1 * expected_max_z;
 
-                auto expected_x = tokamak_options.Rxy(jx, jy) * std::cos(tokamak_options.toroidal_angles[jz]);
-                auto expected_y = tokamak_options.Rxy(jx, jy) * std::sin(tokamak_options.toroidal_angles[jz]);
-                auto expected_z = tokamak_options.Zxy(jx, jy);
+    const auto actual_max_x = max(cartesian_coords.x, false, "RGN_ALL");
+    const auto actual_max_y = max(cartesian_coords.y, false, "RGN_ALL");
+    const auto actual_max_z = max(cartesian_coords.z, false, "RGN_ALL");
+    const auto actual_min_x = min(cartesian_coords.x, false, "RGN_ALL");
+    const auto actual_min_y = min(cartesian_coords.y, false, "RGN_ALL");
+    const auto actual_min_z = min(cartesian_coords.z, false, "RGN_ALL");
 
-                EXPECT_EQ(actual_x, expected_x);
-                EXPECT_EQ(actual_y, expected_y);
-                EXPECT_EQ(actual_z, expected_z);
-            }
-        }
-    }
+    EXPECT_EQ(expected_max_x, actual_max_x);
+    EXPECT_EQ(expected_max_y, actual_max_y);
+    EXPECT_EQ(expected_max_z, actual_max_z);
+    EXPECT_EQ(expected_min_x, actual_min_x);
+    EXPECT_EQ(expected_min_y, actual_min_y);
+    EXPECT_EQ(expected_min_z, actual_min_z);
 }

From 3853d3dca954e42001dd1231eaae6631c35a2426 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Tue, 27 May 2025 16:38:01 -0700
Subject: [PATCH 065/129] Use python f-strings

Cleans up test code

Co-authored-by: David Bold <dschwoerer@users.noreply.github.com>
---
 tests/integrated/test-laplace-hypre3d/runtest | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/integrated/test-laplace-hypre3d/runtest b/tests/integrated/test-laplace-hypre3d/runtest
index f1f5950547..89acf79364 100755
--- a/tests/integrated/test-laplace-hypre3d/runtest
+++ b/tests/integrated/test-laplace-hypre3d/runtest
@@ -29,10 +29,10 @@ for directory, nproc in test_directories:
     error_max = collect("error_max", path=directory, info=False)
 
     if error_max > tolerance:
-        print(" => " + directory + " failed with maximum error {}".format(error_max))
+        print(f" => {directory} failed with maximum error {error_max}")
         success = False
     else:
-        print(" => " + directory + " passed with maximum error {}".format(error_max))
+        print(f" => {directory} passed with maximum error {error_max}")
 
 if success:
     print("=> All passed")

From a7771c5ab4e2f0aa5eacf524b89b23e1934be0b4 Mon Sep 17 00:00:00 2001
From: Steven Roberts <roberts115@llnl.gov>
Date: Thu, 29 May 2025 23:20:59 -0700
Subject: [PATCH 066/129] Fix bug where ARKODE considered all problems linear

---
 src/solver/impls/arkode/arkode.cxx | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/src/solver/impls/arkode/arkode.cxx b/src/solver/impls/arkode/arkode.cxx
index 23883cc043..6f20ce11a6 100644
--- a/src/solver/impls/arkode/arkode.cxx
+++ b/src/solver/impls/arkode/arkode.cxx
@@ -229,9 +229,11 @@ int ArkodeSolver::init() {
     throw BoutException("ARKodeSetUserData failed\n");
   }
 
-  if (ARKodeSetLinear(arkode_mem, static_cast<int>(set_linear))
-      != ARK_SUCCESS) {
-    throw BoutException("ARKodeSetLinear failed\n");
+  if (set_linear) {
+    constexpr bool is_time_dep = false;
+    if (ARKodeSetLinear(arkode_mem, is_time_dep) != ARK_SUCCESS) {
+      throw BoutException("ARKodeSetLinear failed\n");
+    }
   }
 
   if (fixed_step) {

From 6b1d6f48a977e31795931f65f99a0078a7cdcb48 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Tue, 3 Jun 2025 11:52:56 +0200
Subject: [PATCH 067/129] Fix call depending on PETSc version

---
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 853d8eaf12..07d3b6ca1b 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -652,7 +652,13 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
       MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
       // Set the function to difference
       MatFDColoringSetFunction(
-          fdcoloring, reinterpret_cast<PetscErrorCode (*)()>(FormFunctionForColoring),
+          fdcoloring,
+#if (PETSC_VERSION_GE(3,24,0) || \
+   (PETSC_VERSION_GE(3,23,0) && PETSC_VERSION_RELEASE == 0)
+          reinterpret_cast<MatFDColoringFn>(FormFunctionForColoring),
+#else
+          reinterpret_cast<PetscErrorCode (*)()>(FormFunctionForColoring),
+#endif
           this);
       MatFDColoringSetFromOptions(fdcoloring);
       MatFDColoringSetUp(Jmf, iscoloring, fdcoloring);

From d8fd1b546e09d60c91e3b1f9650ced2692ea0ae5 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Tue, 3 Jun 2025 12:00:06 +0200
Subject: [PATCH 068/129] Remove extra (

---
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 07d3b6ca1b..f39a73eee2 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -653,7 +653,7 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
       // Set the function to difference
       MatFDColoringSetFunction(
           fdcoloring,
-#if (PETSC_VERSION_GE(3,24,0) || \
+#if PETSC_VERSION_GE(3,24,0) || \
    (PETSC_VERSION_GE(3,23,0) && PETSC_VERSION_RELEASE == 0)
           reinterpret_cast<MatFDColoringFn>(FormFunctionForColoring),
 #else

From 651d41d302f9a2b748ef47bb8171c106f511a6a8 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Tue, 3 Jun 2025 12:28:04 +0200
Subject: [PATCH 069/129] Update function signature to avoid cast

---
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index f39a73eee2..f4e3a02327 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -95,7 +95,7 @@ IMEXBDF2::~IMEXBDF2() {
  * This function assumes the context void pointer is a pointer
  * to an IMEXBDF2 object.
  */
-static PetscErrorCode FormFunction(SNES UNUSED(snes), Vec x, Vec f, void* ctx) {
+static PetscErrorCode FormFunction(void* UNUSED(snes), Vec x, Vec f, void* ctx) {
   return static_cast<IMEXBDF2*>(ctx)->snes_function(x, f, false);
 }
 
@@ -113,7 +113,7 @@ static PetscErrorCode FormFunctionForDifferencing(void* ctx, Vec x, Vec f) {
  *
  * This can be a linearised and simplified form of FormFunction
  */
-static PetscErrorCode FormFunctionForColoring(SNES UNUSED(snes), Vec x, Vec f,
+static PetscErrorCode FormFunctionForColoring(void* UNUSED(snes), Vec x, Vec f,
                                               void* ctx) {
   return static_cast<IMEXBDF2*>(ctx)->snes_function(x, f, true);
 }
@@ -655,7 +655,7 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
           fdcoloring,
 #if PETSC_VERSION_GE(3,24,0) || \
    (PETSC_VERSION_GE(3,23,0) && PETSC_VERSION_RELEASE == 0)
-          reinterpret_cast<MatFDColoringFn>(FormFunctionForColoring),
+          FormFunctionForColoring,
 #else
           reinterpret_cast<PetscErrorCode (*)()>(FormFunctionForColoring),
 #endif

From 88c34feec7bef59af931a2acb0f061d39e7b6d2d Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Tue, 3 Jun 2025 12:34:46 +0200
Subject: [PATCH 070/129] Revert modification of wrong function

---
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index f4e3a02327..5ef1288a32 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -95,7 +95,7 @@ IMEXBDF2::~IMEXBDF2() {
  * This function assumes the context void pointer is a pointer
  * to an IMEXBDF2 object.
  */
-static PetscErrorCode FormFunction(void* UNUSED(snes), Vec x, Vec f, void* ctx) {
+static PetscErrorCode FormFunction(SNES UNUSED(snes), Vec x, Vec f, void* ctx) {
   return static_cast<IMEXBDF2*>(ctx)->snes_function(x, f, false);
 }
 

From 1ead0446b71f81f6dcb63a2b3f47a3cc0fa4db15 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Wed, 4 Jun 2025 12:16:39 +0200
Subject: [PATCH 071/129] Adjust petsc solver for petsc changes

---
 src/solver/impls/petsc/petsc.cxx | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/src/solver/impls/petsc/petsc.cxx b/src/solver/impls/petsc/petsc.cxx
index 090087d0de..585fec5d71 100644
--- a/src/solver/impls/petsc/petsc.cxx
+++ b/src/solver/impls/petsc/petsc.cxx
@@ -515,7 +515,13 @@ int PetscSolver::init() {
   ierr = ISColoringDestroy(&iscoloring);
   CHKERRQ(ierr);
   ierr = MatFDColoringSetFunction(matfdcoloring,
-                                  reinterpret_cast<PetscErrorCode (*)()>(solver_f), this);
+#if PETSC_VERSION_GE(3,24,0) || \
+   (PETSC_VERSION_GE(3,23,0) && PETSC_VERSION_RELEASE == 0)
+                                  solver_f,
+#else
+                                  reinterpret_cast<PetscErrorCode (*)()>(solver_f),
+#endif
+                                  this);
   CHKERRQ(ierr);
   ierr = SNESSetJacobian(snes, J, J, SNESComputeJacobianDefaultColor, matfdcoloring);
   CHKERRQ(ierr);

From 1bd95ddb9470718f5204969bcc8a2edbbb10ce38 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Wed, 4 Jun 2025 13:57:59 +0200
Subject: [PATCH 072/129] Adapt snes.cxx for newest petsc changes

---
 src/solver/impls/snes/snes.cxx | 11 +++++++++--
 1 file changed, 9 insertions(+), 2 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 4dce1e7086..32407d861f 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1291,8 +1291,15 @@ void SNESSolver::updateColoring() {
   // Replace the old coloring with the new one
   MatFDColoringDestroy(&fdcoloring);
   MatFDColoringCreate(Jfd, iscoloring, &fdcoloring);
-  MatFDColoringSetFunction(
-      fdcoloring, reinterpret_cast<PetscErrorCode (*)()>(FormFunctionForColoring), this);
+  MatFDColoringSetFunction(fdcoloring,
+#if PETSC_VERSION_GE(3, 24, 0) \
+    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
+                           FormFunctionForColoring,
+#else
+                           reinterpret_cast<PetscErrorCode (*)()>(
+                               FormFunctionForColoring),
+#endif
+                           this);
   MatFDColoringSetFromOptions(fdcoloring);
   MatFDColoringSetUp(Jfd, iscoloring, fdcoloring);
   ISColoringDestroy(&iscoloring);

From 04338cdb156330fa1b81f024dd6db7aa443ed2e3 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Thu, 5 Jun 2025 00:56:05 +0200
Subject: [PATCH 073/129] coloring for petsc solver is very likely broken

---
 src/solver/impls/petsc/petsc.cxx | 10 +---------
 1 file changed, 1 insertion(+), 9 deletions(-)

diff --git a/src/solver/impls/petsc/petsc.cxx b/src/solver/impls/petsc/petsc.cxx
index 585fec5d71..dd63811f0f 100644
--- a/src/solver/impls/petsc/petsc.cxx
+++ b/src/solver/impls/petsc/petsc.cxx
@@ -514,15 +514,7 @@ int PetscSolver::init() {
   CHKERRQ(ierr);
   ierr = ISColoringDestroy(&iscoloring);
   CHKERRQ(ierr);
-  ierr = MatFDColoringSetFunction(matfdcoloring,
-#if PETSC_VERSION_GE(3,24,0) || \
-   (PETSC_VERSION_GE(3,23,0) && PETSC_VERSION_RELEASE == 0)
-                                  solver_f,
-#else
-                                  reinterpret_cast<PetscErrorCode (*)()>(solver_f),
-#endif
-                                  this);
-  CHKERRQ(ierr);
+  throw BoutException("Coloring is not working");
   ierr = SNESSetJacobian(snes, J, J, SNESComputeJacobianDefaultColor, matfdcoloring);
   CHKERRQ(ierr);
 

From c84a2fc64caa10b7fb61262749c2f589646a5201 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Thu, 5 Jun 2025 10:26:47 +0200
Subject: [PATCH 074/129] Cast to fix first argument from SNES to void*

---
 src/solver/impls/snes/snes.cxx | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 32407d861f..601c537994 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1294,7 +1294,8 @@ void SNESSolver::updateColoring() {
   MatFDColoringSetFunction(fdcoloring,
 #if PETSC_VERSION_GE(3, 24, 0) \
     || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
-                           FormFunctionForColoring,
+                           reinterpret_cast<PetscErrorCode (*)(void*, Vec, Vec, void*)>(
+                               FormFunctionForColoring),
 #else
                            reinterpret_cast<PetscErrorCode (*)()>(
                                FormFunctionForColoring),

From 4b09458aee554baae391bcc6b9362cc1f67c600a Mon Sep 17 00:00:00 2001
From: dschwoerer <5637662+dschwoerer@users.noreply.github.com>
Date: Thu, 5 Jun 2025 10:03:47 +0000
Subject: [PATCH 075/129] Apply clang-format changes

---
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 5ef1288a32..91bded7b17 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -651,15 +651,15 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
       // Create data structure for SNESComputeJacobianDefaultColor
       MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
       // Set the function to difference
-      MatFDColoringSetFunction(
-          fdcoloring,
-#if PETSC_VERSION_GE(3,24,0) || \
-   (PETSC_VERSION_GE(3,23,0) && PETSC_VERSION_RELEASE == 0)
-          FormFunctionForColoring,
+      MatFDColoringSetFunction(fdcoloring,
+#if PETSC_VERSION_GE(3, 24, 0) \
+    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
+                               FormFunctionForColoring,
 #else
-          reinterpret_cast<PetscErrorCode (*)()>(FormFunctionForColoring),
+                               reinterpret_cast<PetscErrorCode (*)()>(
+                                   FormFunctionForColoring),
 #endif
-          this);
+                               this);
       MatFDColoringSetFromOptions(fdcoloring);
       MatFDColoringSetUp(Jmf, iscoloring, fdcoloring);
       ISColoringDestroy(&iscoloring);

From 22e2e84d0c605a7fef74fbd251ca86bdafba223d Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Fri, 6 Jun 2025 11:40:56 +0200
Subject: [PATCH 076/129] Cleanup casting

Avoid #if preprocessing in function calls
---
 include/bout/petsc_interface.hxx         |  7 +++++++
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 10 +++++-----
 src/solver/impls/snes/snes.cxx           | 12 ++----------
 3 files changed, 14 insertions(+), 15 deletions(-)

diff --git a/include/bout/petsc_interface.hxx b/include/bout/petsc_interface.hxx
index 1378419872..ce12b16804 100644
--- a/include/bout/petsc_interface.hxx
+++ b/include/bout/petsc_interface.hxx
@@ -566,6 +566,13 @@ PetscVector<T> operator*(const PetscMatrix<T>& mat, const PetscVector<T>& vec) {
   return PetscVector<T>(vec, result);
 }
 
+// Compatibility wrappers
+// For < 3.24
+#if PETSC_VERSION_LE(3, 22, 0) \
+    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
+using MatFDColoringFn = PetscErrorCode (*)();
+#endif
+
 #endif // BOUT_HAS_PETSC
 
 #endif // BOUT_PETSC_INTERFACE_H
diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 91bded7b17..8126ab6f37 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -651,15 +651,15 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
       // Create data structure for SNESComputeJacobianDefaultColor
       MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
       // Set the function to difference
-      MatFDColoringSetFunction(fdcoloring,
-#if PETSC_VERSION_GE(3, 24, 0) \
+#if PETSC_VERSION_LE(3, 22, 0) \
     || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
-                               FormFunctionForColoring,
+#define FUNC_MAYBE_CAST(func) reinterpret_cast<MatFDColoringFn>(func)
 #else
-                               reinterpret_cast<PetscErrorCode (*)()>(
-                                   FormFunctionForColoring),
+#define FUNC_MAYBE_CAST(func) func
 #endif
+      MatFDColoringSetFunction(fdcoloring, FUNC_MAYBE_CAST(FormFunctionForColoring),
                                this);
+#undef FUNC_MAYBE_CAST
       MatFDColoringSetFromOptions(fdcoloring);
       MatFDColoringSetUp(Jmf, iscoloring, fdcoloring);
       ISColoringDestroy(&iscoloring);
diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 601c537994..e280ed09fa 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1291,16 +1291,8 @@ void SNESSolver::updateColoring() {
   // Replace the old coloring with the new one
   MatFDColoringDestroy(&fdcoloring);
   MatFDColoringCreate(Jfd, iscoloring, &fdcoloring);
-  MatFDColoringSetFunction(fdcoloring,
-#if PETSC_VERSION_GE(3, 24, 0) \
-    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
-                           reinterpret_cast<PetscErrorCode (*)(void*, Vec, Vec, void*)>(
-                               FormFunctionForColoring),
-#else
-                           reinterpret_cast<PetscErrorCode (*)()>(
-                               FormFunctionForColoring),
-#endif
-                           this);
+  MatFDColoringSetFunction(
+      fdcoloring, reinterpret_cast<MatFDColoringFn>(FormFunctionForColoring), this);
   MatFDColoringSetFromOptions(fdcoloring);
   MatFDColoringSetUp(Jfd, iscoloring, fdcoloring);
   ISColoringDestroy(&iscoloring);

From fd386e18ae201c706eb47b20c55fb4c1a3f23c42 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Fri, 6 Jun 2025 11:41:57 +0200
Subject: [PATCH 077/129] Update docs for what PETSc we support

3.23 has been tested in CI so is expected to work.
---
 manual/RELEASE_HOWTO.md                      | 1 +
 manual/sphinx/user_docs/advanced_install.rst | 2 +-
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/manual/RELEASE_HOWTO.md b/manual/RELEASE_HOWTO.md
index 4103e6f197..d8ced2afb5 100644
--- a/manual/RELEASE_HOWTO.md
+++ b/manual/RELEASE_HOWTO.md
@@ -51,6 +51,7 @@ Before merging PR:
     - [ ]  [`manual/doxygen/Doxyfile_readthedocs`][Doxyfile_readthedocs]: `PROJECT_NUMBER`
     - [ ]  [`manual/doxygen/Doxyfile`][Doxyfile]: `PROJECT_NUMBER`
     - [ ]  [`CMakeLists.txt`][CMakeLists]: `_bout_previous_version`, `_bout_next_version`
+- [ ] Update what version of PETSc and SUNDIALS we support (upper bound)
 
 
 After PR is merged:
diff --git a/manual/sphinx/user_docs/advanced_install.rst b/manual/sphinx/user_docs/advanced_install.rst
index 048a26a6e3..f8e594be07 100644
--- a/manual/sphinx/user_docs/advanced_install.rst
+++ b/manual/sphinx/user_docs/advanced_install.rst
@@ -355,7 +355,7 @@ BOUT++ can use PETSc https://www.mcs.anl.gov/petsc/ for time-integration
 and for solving elliptic problems, such as inverting Poisson and
 Helmholtz equations.
 
-Currently, BOUT++ supports PETSc versions 3.7 - 3.19. More recent versions may
+Currently, BOUT++ supports PETSc versions 3.7 - 3.23. More recent versions may
 well work, but the PETSc API does sometimes change in backward-incompatible
 ways, so this is not guaranteed. To install PETSc version 3.19, use the
 following steps::

From c4c9b923e87d81c98c8905d7acc23b760d221833 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Fri, 6 Jun 2025 11:42:13 +0200
Subject: [PATCH 078/129] Remove old checks

---
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 5 -----
 1 file changed, 5 deletions(-)

diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 8126ab6f37..4c663907df 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -683,12 +683,7 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
           0, // Number of nonzeros per row in off-diagonal portion of local submatrix
           nullptr, &Jmf);
 
-#if PETSC_VERSION_GE(3, 4, 0)
       SNESSetJacobian(*snesIn, Jmf, Jmf, SNESComputeJacobianDefault, this);
-#else
-      // Before 3.4
-      SNESSetJacobian(*snesIn, Jmf, Jmf, SNESDefaultComputeJacobian, this);
-#endif
 
       MatSetOption(Jmf, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_FALSE);
     }

From 6506d18436d2ea4530b859ddae844249948c3595 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Sun, 8 Jun 2025 21:00:44 +0200
Subject: [PATCH 079/129] Add missing header

---
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 4c663907df..6363760e7e 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -9,6 +9,7 @@
 #include <bout/boutexception.hxx>
 #include <bout/mesh.hxx>
 #include <bout/msg_stack.hxx>
+#include <bout/petsc_interface.hxx>
 #include <bout/utils.hxx>
 
 #include <cmath>

From 6d1db3506aa26e8a144cc9b68ba2cdd9b284644e Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Sun, 8 Jun 2025 23:20:31 +0200
Subject: [PATCH 080/129] Fix usage of macros

---
 include/bout/petsc_interface.hxx         | 6 ++++--
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 8 ++++----
 2 files changed, 8 insertions(+), 6 deletions(-)

diff --git a/include/bout/petsc_interface.hxx b/include/bout/petsc_interface.hxx
index ce12b16804..b59e8d9531 100644
--- a/include/bout/petsc_interface.hxx
+++ b/include/bout/petsc_interface.hxx
@@ -568,8 +568,10 @@ PetscVector<T> operator*(const PetscMatrix<T>& mat, const PetscVector<T>& vec) {
 
 // Compatibility wrappers
 // For < 3.24
-#if PETSC_VERSION_LE(3, 22, 0) \
-    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
+#if PETSC_VERSION_GE(3, 24, 0) \
+    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE != 0)
+// Nothing to do
+#else
 using MatFDColoringFn = PetscErrorCode (*)();
 #endif
 
diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 6363760e7e..7b53f18465 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -652,11 +652,11 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
       // Create data structure for SNESComputeJacobianDefaultColor
       MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
       // Set the function to difference
-#if PETSC_VERSION_LE(3, 22, 0) \
-    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
-#define FUNC_MAYBE_CAST(func) reinterpret_cast<MatFDColoringFn>(func)
-#else
+#if PETSC_VERSION_GE(3, 24, 0) \
+    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE != 0)
 #define FUNC_MAYBE_CAST(func) func
+#else
+#define FUNC_MAYBE_CAST(func) reinterpret_cast<MatFDColoringFn>(func)
 #endif
       MatFDColoringSetFunction(fdcoloring, FUNC_MAYBE_CAST(FormFunctionForColoring),
                                this);

From 086a8b1f48493bbcd11807a36c26e25e90d435ab Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Tue, 10 Jun 2025 12:49:11 +0100
Subject: [PATCH 081/129] Add nx, ny, nz as optional arguments to
 FakeMeshFixture constructor

---
 tests/unit/fake_mesh_fixture.hxx | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/unit/fake_mesh_fixture.hxx b/tests/unit/fake_mesh_fixture.hxx
index 4c33093aee..dcda38de81 100644
--- a/tests/unit/fake_mesh_fixture.hxx
+++ b/tests/unit/fake_mesh_fixture.hxx
@@ -27,13 +27,13 @@
 ///     using MyTest = FakeMeshFixture;
 class FakeMeshFixture : public ::testing::Test {
 public:
-    FakeMeshFixture() {
+    FakeMeshFixture(int nx_ = nx, int ny_ = ny, int nz_ = nz) {
         WithQuietOutput quiet_info{output_info};
         WithQuietOutput quiet_warn{output_warn};
 
         delete bout::globals::mesh;
         bout::globals::mpi = new MpiWrapper();
-        bout::globals::mesh = new FakeMesh(nx, ny, nz);
+        bout::globals::mesh = new FakeMesh(nx_, ny_, nz_);
         bout::globals::mesh->createDefaultRegions();
         static_cast<FakeMesh*>(bout::globals::mesh)->setCoordinates(nullptr);
         test_coords = std::make_shared<Coordinates>(
@@ -71,7 +71,7 @@ public:
         dynamic_cast<FakeMesh*>(bout::globals::mesh)->createBoundaryRegions();
 
         delete mesh_staggered;
-        mesh_staggered = new FakeMesh(nx, ny, nz);
+        mesh_staggered = new FakeMesh(nx_, ny_, nz_);
         mesh_staggered->StaggerGrids = true;
         dynamic_cast<FakeMesh*>(mesh_staggered)->setCoordinates(nullptr);
         dynamic_cast<FakeMesh*>(mesh_staggered)->setCoordinates(nullptr, CELL_XLOW);

From 0d432140fd50f07b68f96f0fe36103590d95c5ed Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Tue, 10 Jun 2025 13:00:30 +0100
Subject: [PATCH 082/129] Use nz=8 in CoordinateTransformTest

so that there will be a toroidal point at pi/2.
---
 .../unit/mesh/test_change_coordinate_system.cxx | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index 3777beb3f1..c2a36ed18a 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -5,6 +5,9 @@
 #include "bout/constants.hxx"
 #include <bout/tokamak_coordinates.hxx>
 
+static constexpr int NX = 3;
+static constexpr int NY = 5;
+static constexpr int NZ = 8;
 
 using bout::globals::mesh;
 
@@ -12,7 +15,7 @@ class CoordinateTransformTest : public FakeMeshFixture {
 public:
     using FieldMetric = Coordinates::FieldMetric;
 
-    CoordinateTransformTest() : FakeMeshFixture() {}
+    CoordinateTransformTest() : FakeMeshFixture(NX, NY, NZ) {}
 };
 
 TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
@@ -24,8 +27,8 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
     // from (2D) orthogonal poloidal coordinates (r, theta)
 
     const double R0 = 2.0;  // major radius
-    const std::array<double, nx> r_values = {0.1, 0.2, 0.3};  // minor radius
-    const std::array<double, ny> theta_values = {  // poloidal angle
+    const std::array<double, NX> r_values = {0.1, 0.2, 0.3};  // minor radius
+    const std::array<double, NY> theta_values = {  // poloidal angle
             0.0,
             PI / 2,
             PI,
@@ -51,13 +54,11 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
     // assert
     const auto max_r = *std::max_element(begin(r_values), end(r_values));
     const auto expected_max_x = R0 + max_r;
-    // With nz=7, there is no toroidal coordinate point at exactly pi/2; the nearest point is at 2/7 * 2pi
-    const auto expected_max_y = (R0 + max_r) * std::sin(TWOPI * 2 / 7);
+    const auto expected_max_y = (R0 + max_r);
     const auto expected_max_z = max_r;
 
-    // With nz=7, there is no toroidal coordinate point at exactly pi; the nearest point is at 3/7 * 2pi
-    const auto expected_min_x = -1 * (R0 + max_r) * std::cos(TWOPI / 7 / 2);
-    const auto expected_min_y = -1 * (R0 + max_r) * std::sin(TWOPI * 2 / 7);
+    const auto expected_min_x = -1 * (R0 + max_r);
+    const auto expected_min_y = -1 * (R0 + max_r);
     const auto expected_min_z = -1 * expected_max_z;
 
     const auto actual_max_x = max(cartesian_coords.x, false, "RGN_ALL");

From c0a9155ea8ff128736f4b2d9f0f4b852109796b3 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Thu, 12 Jun 2025 07:28:22 +0200
Subject: [PATCH 083/129] Add missing include

---
 src/solver/impls/snes/snes.cxx | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index e280ed09fa..276fade7b6 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -8,6 +8,7 @@
 #include <bout/boutexception.hxx>
 #include <bout/globals.hxx>
 #include <bout/msg_stack.hxx>
+#include <bout/petsc_interface.hxx>
 #include <bout/utils.hxx>
 
 #include <cmath>

From 844da11ac343c77484c5feb399610c8ba59ab41e Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Thu, 12 Jun 2025 07:50:50 +0200
Subject: [PATCH 084/129] Always cast to PetscErrorCode (*f)(void)

---
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 12 +++---------
 1 file changed, 3 insertions(+), 9 deletions(-)

diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 7b53f18465..2766db3e96 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -652,15 +652,9 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
       // Create data structure for SNESComputeJacobianDefaultColor
       MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
       // Set the function to difference
-#if PETSC_VERSION_GE(3, 24, 0) \
-    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE != 0)
-#define FUNC_MAYBE_CAST(func) func
-#else
-#define FUNC_MAYBE_CAST(func) reinterpret_cast<MatFDColoringFn>(func)
-#endif
-      MatFDColoringSetFunction(fdcoloring, FUNC_MAYBE_CAST(FormFunctionForColoring),
-                               this);
-#undef FUNC_MAYBE_CAST
+      MatFDColoringSetFunction(
+          fdcoloring,
+          reinterpret_cast<PetscErrorCode (*f)(void)>(FormFunctionForColoring), this);
       MatFDColoringSetFromOptions(fdcoloring);
       MatFDColoringSetUp(Jmf, iscoloring, fdcoloring);
       ISColoringDestroy(&iscoloring);

From ad178b1c12dd711c69682223b656c20a2584ccb9 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Thu, 12 Jun 2025 08:00:42 +0200
Subject: [PATCH 085/129] Fix check for release

---
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 12 +++++++++---
 1 file changed, 9 insertions(+), 3 deletions(-)

diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 2766db3e96..a66ec47799 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -652,9 +652,15 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
       // Create data structure for SNESComputeJacobianDefaultColor
       MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
       // Set the function to difference
-      MatFDColoringSetFunction(
-          fdcoloring,
-          reinterpret_cast<PetscErrorCode (*f)(void)>(FormFunctionForColoring), this);
+#if PETSC_VERSION_GE(3, 24, 0) \
+    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
+#define FUNC_MAYBE_CAST(func) func
+#else
+#define FUNC_MAYBE_CAST(func) reinterpret_cast<MatFDColoringFn>(func)
+#endif
+      MatFDColoringSetFunction(fdcoloring, FUNC_MAYBE_CAST(FormFunctionForColoring),
+                               this);
+#undef FUNC_MAYBE_CAST
       MatFDColoringSetFromOptions(fdcoloring);
       MatFDColoringSetUp(Jmf, iscoloring, fdcoloring);
       ISColoringDestroy(&iscoloring);

From 64b8bd0d37df382b980981b965c6efa2d03d396a Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Thu, 12 Jun 2025 12:38:34 +0100
Subject: [PATCH 086/129] Use type alias FakeMeshFixture =
 FakeMeshFixture_tmpl<3, 5, 7> as a shim to allow FakeMeshFixture to be used
 with default values for nx, ny, nz

---
 tests/unit/fake_mesh_fixture.hxx              | 24 ++++++++++++-------
 .../mesh/test_change_coordinate_system.cxx    |  4 ++--
 2 files changed, 17 insertions(+), 11 deletions(-)

diff --git a/tests/unit/fake_mesh_fixture.hxx b/tests/unit/fake_mesh_fixture.hxx
index dcda38de81..d4c10107e3 100644
--- a/tests/unit/fake_mesh_fixture.hxx
+++ b/tests/unit/fake_mesh_fixture.hxx
@@ -25,15 +25,19 @@
 /// alias to make a new test:
 ///
 ///     using MyTest = FakeMeshFixture;
-class FakeMeshFixture : public ::testing::Test {
+///
+///     Type alias FakeMeshFixture = FakeMeshFixture_tmpl<3, 5, 7>;
+///     is used as a shim to allow FakeMeshFixture to be used with default values for nx, ny, nz
+template<int NX, int NY, int NZ>
+class FakeMeshFixture_tmpl : public ::testing::Test {
 public:
-    FakeMeshFixture(int nx_ = nx, int ny_ = ny, int nz_ = nz) {
+    FakeMeshFixture_tmpl() {
         WithQuietOutput quiet_info{output_info};
         WithQuietOutput quiet_warn{output_warn};
 
         delete bout::globals::mesh;
         bout::globals::mpi = new MpiWrapper();
-        bout::globals::mesh = new FakeMesh(nx_, ny_, nz_);
+        bout::globals::mesh = new FakeMesh(NX, NY, NZ);
         bout::globals::mesh->createDefaultRegions();
         static_cast<FakeMesh*>(bout::globals::mesh)->setCoordinates(nullptr);
         test_coords = std::make_shared<Coordinates>(
@@ -71,7 +75,7 @@ public:
         dynamic_cast<FakeMesh*>(bout::globals::mesh)->createBoundaryRegions();
 
         delete mesh_staggered;
-        mesh_staggered = new FakeMesh(nx_, ny_, nz_);
+        mesh_staggered = new FakeMesh(NX, NY, NZ);
         mesh_staggered->StaggerGrids = true;
         dynamic_cast<FakeMesh*>(mesh_staggered)->setCoordinates(nullptr);
         dynamic_cast<FakeMesh*>(mesh_staggered)->setCoordinates(nullptr, CELL_XLOW);
@@ -123,7 +127,7 @@ public:
                 ->setCoordinates(test_coords_staggered, CELL_ZLOW);
     }
 
-    ~FakeMeshFixture() override {
+    ~FakeMeshFixture_tmpl() override {
         delete bout::globals::mesh;
         bout::globals::mesh = nullptr;
         delete mesh_staggered;
@@ -134,12 +138,14 @@ public:
         Options::cleanup();
     }
 
-    static constexpr int nx = 3;
-    static constexpr int ny = 5;
-    static constexpr int nz = 7;
+    static constexpr int nx = NX;
+    static constexpr int ny = NY;
+    static constexpr int nz = NZ;
 
     Mesh* mesh_staggered = nullptr;
 
     std::shared_ptr<Coordinates> test_coords{nullptr};
     std::shared_ptr<Coordinates> test_coords_staggered{nullptr};
-};
\ No newline at end of file
+};
+
+using FakeMeshFixture = FakeMeshFixture_tmpl<3, 5, 7>;
\ No newline at end of file
diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index c2a36ed18a..d9ae71e14c 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -11,11 +11,11 @@ static constexpr int NZ = 8;
 
 using bout::globals::mesh;
 
-class CoordinateTransformTest : public FakeMeshFixture {
+class CoordinateTransformTest : public FakeMeshFixture_tmpl<NX, NY, NZ> {
 public:
     using FieldMetric = Coordinates::FieldMetric;
 
-    CoordinateTransformTest() : FakeMeshFixture(NX, NY, NZ) {}
+    CoordinateTransformTest() : FakeMeshFixture_tmpl() {}
 };
 
 TEST_F(CoordinateTransformTest, CylindricalToCartesian) {

From 511f4a9fef63a0c5ee6ecbc6e00ee991d0f0c5cd Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Tue, 17 Jun 2025 16:55:24 +0100
Subject: [PATCH 087/129] Fix PETSc version check for MatFDColoringFn typedef

---
 include/bout/petsc_interface.hxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/include/bout/petsc_interface.hxx b/include/bout/petsc_interface.hxx
index b59e8d9531..6957624213 100644
--- a/include/bout/petsc_interface.hxx
+++ b/include/bout/petsc_interface.hxx
@@ -569,7 +569,7 @@ PetscVector<T> operator*(const PetscMatrix<T>& mat, const PetscVector<T>& vec) {
 // Compatibility wrappers
 // For < 3.24
 #if PETSC_VERSION_GE(3, 24, 0) \
-    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE != 0)
+    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
 // Nothing to do
 #else
 using MatFDColoringFn = PetscErrorCode (*)();

From fa2ff89823adf975ac9d25fa1f7a45567bae9bea Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Tue, 17 Jun 2025 17:04:13 +0100
Subject: [PATCH 088/129] Move "maybe cast" macro to header for reuse

---
 include/bout/petsc_interface.hxx         |  3 ++-
 src/solver/impls/imex-bdf2/imex-bdf2.cxx | 11 ++---------
 src/solver/impls/snes/snes.cxx           |  6 +++---
 3 files changed, 7 insertions(+), 13 deletions(-)

diff --git a/include/bout/petsc_interface.hxx b/include/bout/petsc_interface.hxx
index 6957624213..8a812937d9 100644
--- a/include/bout/petsc_interface.hxx
+++ b/include/bout/petsc_interface.hxx
@@ -570,9 +570,10 @@ PetscVector<T> operator*(const PetscMatrix<T>& mat, const PetscVector<T>& vec) {
 // For < 3.24
 #if PETSC_VERSION_GE(3, 24, 0) \
     || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
-// Nothing to do
+#define BOUT_CAST_MATFDCOLORINGFN(func) func
 #else
 using MatFDColoringFn = PetscErrorCode (*)();
+#define BOUT_CAST_MATFDCOLORINGFN(func) reinterpret_cast<MatFDColoringFn>(func)
 #endif
 
 #endif // BOUT_HAS_PETSC
diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index a66ec47799..9205d90881 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -652,15 +652,8 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
       // Create data structure for SNESComputeJacobianDefaultColor
       MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
       // Set the function to difference
-#if PETSC_VERSION_GE(3, 24, 0) \
-    || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
-#define FUNC_MAYBE_CAST(func) func
-#else
-#define FUNC_MAYBE_CAST(func) reinterpret_cast<MatFDColoringFn>(func)
-#endif
-      MatFDColoringSetFunction(fdcoloring, FUNC_MAYBE_CAST(FormFunctionForColoring),
-                               this);
-#undef FUNC_MAYBE_CAST
+      MatFDColoringSetFunction(fdcoloring,
+                               BOUT_CAST_MATFDCOLORINGFN(FormFunctionForColoring), this);
       MatFDColoringSetFromOptions(fdcoloring);
       MatFDColoringSetUp(Jmf, iscoloring, fdcoloring);
       ISColoringDestroy(&iscoloring);
diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 276fade7b6..890048a52b 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -82,7 +82,7 @@ static PetscErrorCode FormFunctionForDifferencing(void* ctx, Vec x, Vec f) {
  *
  * This can be a linearised and simplified form of FormFunction
  */
-static PetscErrorCode FormFunctionForColoring(SNES UNUSED(snes), Vec x, Vec f,
+static PetscErrorCode FormFunctionForColoring(void* UNUSED(snes), Vec x, Vec f,
                                               void* ctx) {
   return static_cast<SNESSolver*>(ctx)->snes_function(x, f, true);
 }
@@ -1292,8 +1292,8 @@ void SNESSolver::updateColoring() {
   // Replace the old coloring with the new one
   MatFDColoringDestroy(&fdcoloring);
   MatFDColoringCreate(Jfd, iscoloring, &fdcoloring);
-  MatFDColoringSetFunction(
-      fdcoloring, reinterpret_cast<MatFDColoringFn>(FormFunctionForColoring), this);
+  MatFDColoringSetFunction(fdcoloring, BOUT_CAST_MATFDCOLORINGFN(FormFunctionForColoring),
+                           this);
   MatFDColoringSetFromOptions(fdcoloring);
   MatFDColoringSetUp(Jfd, iscoloring, fdcoloring);
   ISColoringDestroy(&iscoloring);

From 6a7e43ed5e231e29a2eead4f6ce1e1821a7e9d53 Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Tue, 17 Jun 2025 18:08:05 +0100
Subject: [PATCH 089/129] Convert macro to constexpr template function

Removes some clang-tidy warnings and silences one about reinterpret_cast
---
 include/bout/petsc_interface.hxx         | 12 ++++++++++--
 src/solver/impls/imex-bdf2/imex-bdf2.cxx |  2 +-
 src/solver/impls/snes/snes.cxx           |  2 +-
 3 files changed, 12 insertions(+), 4 deletions(-)

diff --git a/include/bout/petsc_interface.hxx b/include/bout/petsc_interface.hxx
index 8a812937d9..d520276cfc 100644
--- a/include/bout/petsc_interface.hxx
+++ b/include/bout/petsc_interface.hxx
@@ -570,10 +570,18 @@ PetscVector<T> operator*(const PetscMatrix<T>& mat, const PetscVector<T>& vec) {
 // For < 3.24
 #if PETSC_VERSION_GE(3, 24, 0) \
     || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
-#define BOUT_CAST_MATFDCOLORINGFN(func) func
+namespace bout {
+template<class T>
+constexpr auto cast_MatFDColoringFn(T func) { return func; }
+}
 #else
 using MatFDColoringFn = PetscErrorCode (*)();
-#define BOUT_CAST_MATFDCOLORINGFN(func) reinterpret_cast<MatFDColoringFn>(func)
+namespace bout {
+template<class T>
+constexpr auto cast_MatFDColoringFn(T func) {
+  return reinterpret_cast<MatFDColoringFn>(func); // NOLINT(*-reinterpret-cast)
+}
+}
 #endif
 
 #endif // BOUT_HAS_PETSC
diff --git a/src/solver/impls/imex-bdf2/imex-bdf2.cxx b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
index 9205d90881..07188110ab 100644
--- a/src/solver/impls/imex-bdf2/imex-bdf2.cxx
+++ b/src/solver/impls/imex-bdf2/imex-bdf2.cxx
@@ -653,7 +653,7 @@ void IMEXBDF2::constructSNES(SNES* snesIn) {
       MatFDColoringCreate(Jmf, iscoloring, &fdcoloring);
       // Set the function to difference
       MatFDColoringSetFunction(fdcoloring,
-                               BOUT_CAST_MATFDCOLORINGFN(FormFunctionForColoring), this);
+                               bout::cast_MatFDColoringFn(FormFunctionForColoring), this);
       MatFDColoringSetFromOptions(fdcoloring);
       MatFDColoringSetUp(Jmf, iscoloring, fdcoloring);
       ISColoringDestroy(&iscoloring);
diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 890048a52b..8fad1e5d63 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1292,7 +1292,7 @@ void SNESSolver::updateColoring() {
   // Replace the old coloring with the new one
   MatFDColoringDestroy(&fdcoloring);
   MatFDColoringCreate(Jfd, iscoloring, &fdcoloring);
-  MatFDColoringSetFunction(fdcoloring, BOUT_CAST_MATFDCOLORINGFN(FormFunctionForColoring),
+  MatFDColoringSetFunction(fdcoloring, bout::cast_MatFDColoringFn(FormFunctionForColoring),
                            this);
   MatFDColoringSetFromOptions(fdcoloring);
   MatFDColoringSetUp(Jfd, iscoloring, fdcoloring);

From 5a14fa21f84e57f3e9801f5c4c76f8d093cf8894 Mon Sep 17 00:00:00 2001
From: ZedThree <1486942+ZedThree@users.noreply.github.com>
Date: Tue, 17 Jun 2025 17:10:16 +0000
Subject: [PATCH 090/129] Apply clang-format changes

---
 include/bout/petsc_interface.hxx | 10 ++++++----
 src/solver/impls/snes/snes.cxx   |  4 ++--
 2 files changed, 8 insertions(+), 6 deletions(-)

diff --git a/include/bout/petsc_interface.hxx b/include/bout/petsc_interface.hxx
index d520276cfc..90dd188d8a 100644
--- a/include/bout/petsc_interface.hxx
+++ b/include/bout/petsc_interface.hxx
@@ -571,17 +571,19 @@ PetscVector<T> operator*(const PetscMatrix<T>& mat, const PetscVector<T>& vec) {
 #if PETSC_VERSION_GE(3, 24, 0) \
     || (PETSC_VERSION_GE(3, 23, 0) && PETSC_VERSION_RELEASE == 0)
 namespace bout {
-template<class T>
-constexpr auto cast_MatFDColoringFn(T func) { return func; }
+template <class T>
+constexpr auto cast_MatFDColoringFn(T func) {
+  return func;
 }
+} // namespace bout
 #else
 using MatFDColoringFn = PetscErrorCode (*)();
 namespace bout {
-template<class T>
+template <class T>
 constexpr auto cast_MatFDColoringFn(T func) {
   return reinterpret_cast<MatFDColoringFn>(func); // NOLINT(*-reinterpret-cast)
 }
-}
+} // namespace bout
 #endif
 
 #endif // BOUT_HAS_PETSC
diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 8fad1e5d63..d516f19214 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1292,8 +1292,8 @@ void SNESSolver::updateColoring() {
   // Replace the old coloring with the new one
   MatFDColoringDestroy(&fdcoloring);
   MatFDColoringCreate(Jfd, iscoloring, &fdcoloring);
-  MatFDColoringSetFunction(fdcoloring, bout::cast_MatFDColoringFn(FormFunctionForColoring),
-                           this);
+  MatFDColoringSetFunction(fdcoloring,
+                           bout::cast_MatFDColoringFn(FormFunctionForColoring), this);
   MatFDColoringSetFromOptions(fdcoloring);
   MatFDColoringSetUp(Jfd, iscoloring, fdcoloring);
   ISColoringDestroy(&iscoloring);

From 15a2397f319854c348d5987294946dce5e4f12a6 Mon Sep 17 00:00:00 2001
From: Steven Roberts <roberts115@llnl.gov>
Date: Tue, 17 Jun 2025 18:12:09 -0700
Subject: [PATCH 091/129] Fixes for ELM-PB preconditioner

---
 examples/elm-pb/elm_pb.cxx | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/examples/elm-pb/elm_pb.cxx b/examples/elm-pb/elm_pb.cxx
index 1a2608e62c..d981796200 100644
--- a/examples/elm-pb/elm_pb.cxx
+++ b/examples/elm-pb/elm_pb.cxx
@@ -2041,6 +2041,7 @@ class ELMpb : public PhysicsModel {
   int precon(BoutReal UNUSED(t), BoutReal gamma, BoutReal UNUSED(delta)) {
     // First matrix, applying L
     mesh->communicate(ddt(Psi));
+    ddt(Psi).applyBoundary("neumann");
     Field3D Jrhs;
     if (laplace_perp) {
       Jrhs = Laplace_perp(ddt(Psi));
@@ -2072,9 +2073,10 @@ class ELMpb : public PhysicsModel {
     }
 
     mesh->communicate(Jrhs, ddt(P));
+    ddt(P).applyBoundary("neumann");
 
     Field3D U1 = ddt(U);
-    U1 += (gamma * B0 * B0) * Grad_par(Jrhs, CELL_CENTRE) + (gamma * b0xcv) * Grad(P);
+    U1 += (gamma * B0 * B0) * Grad_par(Jrhs, CELL_CENTRE) + (gamma * b0xcv) * Grad(ddt(P));
 
     // Second matrix, solving Alfven wave dynamics
     static std::unique_ptr<InvertPar> invU{nullptr};

From f880dcb62c6dba8df336bcb2e7d1d100651c1807 Mon Sep 17 00:00:00 2001
From: bendudson <219233+bendudson@users.noreply.github.com>
Date: Sat, 21 Jun 2025 04:21:03 +0000
Subject: [PATCH 092/129] Apply clang-format changes

---
 include/bout/hypre_interface.hxx | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index 15ca97cb8a..365dd715e6 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -1036,12 +1036,12 @@ public:
     case HYPRE_SOLVER_TYPE::gmres: {
       HYPRE_ParCSRGMRESSetKDim(solver,
                                options["kdim"]
-                                 .doc("Set the maximum size of the Krylov space")
-                                 .withDefault(30));
+                                   .doc("Set the maximum size of the Krylov space")
+                                   .withDefault(30));
 
       if (options["skip_real_residual_check"]
-          .doc("Skip the evaluation and the check of the actual residual?")
-          .withDefault<bool>(false)) {
+              .doc("Skip the evaluation and the check of the actual residual?")
+              .withDefault<bool>(false)) {
         HYPRE_GMRESSetSkipRealResidualCheck(solver, 1);
       }
       break;

From 10ccee39de8882f7b3b7d54263660e31f06a9323 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Tue, 10 Jun 2025 12:49:11 +0100
Subject: [PATCH 093/129] Add nx, ny, nz as optional arguments to
 FakeMeshFixture constructor

---
 tests/unit/fake_mesh_fixture.hxx | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/unit/fake_mesh_fixture.hxx b/tests/unit/fake_mesh_fixture.hxx
index 42f7be5446..2b4c164675 100644
--- a/tests/unit/fake_mesh_fixture.hxx
+++ b/tests/unit/fake_mesh_fixture.hxx
@@ -27,8 +27,8 @@
 ///     using MyTest = FakeMeshFixture;
 class FakeMeshFixture : public ::testing::Test {
 public:
-  FakeMeshFixture()
-      : mesh_m(nx, ny, nz, mpi), mesh_staggered_m(nx, ny, nz, mpi),
+  FakeMeshFixture(int nx_ = nx, int ny_ = ny, int nz_ = nz)
+      : mesh_m(nx_, ny_, nz_, mpi), mesh_staggered_m(nx_, ny_, nz_, mpi),
         mesh_staggered(&mesh_staggered_m) {
 
     bout::globals::mpi = &mpi;

From f69ccdc5ebbd3b289822bb6b08d67deffebf1019 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Thu, 12 Jun 2025 12:38:34 +0100
Subject: [PATCH 094/129] Use type alias FakeMeshFixture =
 FakeMeshFixture_tmpl<3, 5, 7> as a shim to allow FakeMeshFixture to be used
 with default values for nx, ny, nz

---
 tests/unit/fake_mesh_fixture.hxx | 28 +++++++++++++++++-----------
 1 file changed, 17 insertions(+), 11 deletions(-)

diff --git a/tests/unit/fake_mesh_fixture.hxx b/tests/unit/fake_mesh_fixture.hxx
index 2b4c164675..68b0ac83b1 100644
--- a/tests/unit/fake_mesh_fixture.hxx
+++ b/tests/unit/fake_mesh_fixture.hxx
@@ -25,10 +25,14 @@
 /// alias to make a new test:
 ///
 ///     using MyTest = FakeMeshFixture;
-class FakeMeshFixture : public ::testing::Test {
+///
+///     Type alias FakeMeshFixture = FakeMeshFixture_tmpl<3, 5, 7>;
+///     is used as a shim to allow FakeMeshFixture to be used with default values for nx, ny, nz
+template<int NX, int NY, int NZ>
+class FakeMeshFixture_tmpl : public ::testing::Test {
 public:
-  FakeMeshFixture(int nx_ = nx, int ny_ = ny, int nz_ = nz)
-      : mesh_m(nx_, ny_, nz_, mpi), mesh_staggered_m(nx_, ny_, nz_, mpi),
+  FakeMeshFixture_tmpl()
+      : mesh_m(NX, NY, NZ, mpi), mesh_staggered_m(NX, NY, NZ, mpi),
         mesh_staggered(&mesh_staggered_m) {
 
     bout::globals::mpi = &mpi;
@@ -108,21 +112,21 @@ public:
     mesh_staggered_m.setCoordinates(test_coords_staggered, CELL_ZLOW);
   }
 
-  FakeMeshFixture(const FakeMeshFixture&) = delete;
-  FakeMeshFixture& operator=(const FakeMeshFixture&) = delete;
-  FakeMeshFixture(FakeMeshFixture&&) = delete;
-  FakeMeshFixture& operator=(FakeMeshFixture&&) = delete;
+  FakeMeshFixture_tmpl(const FakeMeshFixture_tmpl&) = delete;
+  FakeMeshFixture_tmpl& operator=(const FakeMeshFixture_tmpl&) = delete;
+  FakeMeshFixture_tmpl(FakeMeshFixture_tmpl&&) = delete;
+  FakeMeshFixture_tmpl& operator=(FakeMeshFixture_tmpl&&) = delete;
 
-  ~FakeMeshFixture() override {
+  ~FakeMeshFixture_tmpl() override {
     bout::globals::mesh = nullptr;
     bout::globals::mpi = nullptr;
 
     Options::cleanup();
   }
 
-  static constexpr int nx = 3;
-  static constexpr int ny = 5;
-  static constexpr int nz = 7;
+  static constexpr int nx = NX;
+  static constexpr int ny = NY;
+  static constexpr int nz = NZ;
 
 private:
   std::shared_ptr<Coordinates> test_coords{nullptr};
@@ -139,3 +143,5 @@ public:
   // Public pointer to our staggered mesh
   Mesh* mesh_staggered; // NOLINT
 };
+
+using FakeMeshFixture = FakeMeshFixture_tmpl<3, 5, 7>;

From d3bd5f9b017b6dbcf59cd211642bd5d75bce28e9 Mon Sep 17 00:00:00 2001
From: tomc271 <58003025+tomc271@users.noreply.github.com>
Date: Mon, 23 Jun 2025 15:25:19 +0000
Subject: [PATCH 095/129] Apply clang-format changes

---
 tests/unit/fake_mesh_fixture.hxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/unit/fake_mesh_fixture.hxx b/tests/unit/fake_mesh_fixture.hxx
index 68b0ac83b1..d717cfb826 100644
--- a/tests/unit/fake_mesh_fixture.hxx
+++ b/tests/unit/fake_mesh_fixture.hxx
@@ -28,7 +28,7 @@
 ///
 ///     Type alias FakeMeshFixture = FakeMeshFixture_tmpl<3, 5, 7>;
 ///     is used as a shim to allow FakeMeshFixture to be used with default values for nx, ny, nz
-template<int NX, int NY, int NZ>
+template <int NX, int NY, int NZ>
 class FakeMeshFixture_tmpl : public ::testing::Test {
 public:
   FakeMeshFixture_tmpl()

From d7cdc65e6f9de35499d50efd0429cc6d27ab96ee Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Mon, 23 Jun 2025 16:36:47 +0100
Subject: [PATCH 096/129] Small tidy of test class docstring

---
 tests/unit/fake_mesh_fixture.hxx | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/tests/unit/fake_mesh_fixture.hxx b/tests/unit/fake_mesh_fixture.hxx
index d717cfb826..2758dbe416 100644
--- a/tests/unit/fake_mesh_fixture.hxx
+++ b/tests/unit/fake_mesh_fixture.hxx
@@ -26,8 +26,11 @@
 ///
 ///     using MyTest = FakeMeshFixture;
 ///
-///     Type alias FakeMeshFixture = FakeMeshFixture_tmpl<3, 5, 7>;
-///     is used as a shim to allow FakeMeshFixture to be used with default values for nx, ny, nz
+/// Type alias `FakeMeshFixture = FakeMeshFixture_tmpl<3, 5, 7>`
+/// is used as a shim to allow FakeMeshFixture to be used with default values for nx, ny, nz.
+/// Use this template class directly to use different sized grid:
+///
+///     using MyTest = FakeMeshFixture_tmpl<7, 9, 11>;
 template <int NX, int NY, int NZ>
 class FakeMeshFixture_tmpl : public ::testing::Test {
 public:

From 391b06bcf9daff93bf627e085a2b1bec61367dea Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Tue, 24 Jun 2025 10:54:16 +0200
Subject: [PATCH 097/129] CI: Switch to released fedora

Resolves: #3127
---
 .github/workflows/tests.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml
index 90c63e0233..4153ebaefc 100644
--- a/.github/workflows/tests.yml
+++ b/.github/workflows/tests.yml
@@ -208,8 +208,8 @@ jobs:
       - uses: actions/checkout@v4
         with:
           submodules: true
-      - name: Build Fedora rawhide
-        run: ./.ci_fedora.sh setup openmpi rawhide
+      - name: Build Fedora
+        run: ./.ci_fedora.sh setup openmpi latest
         shell: bash
         env:
           TRAVIS_BUILD_DIR: ${{ github.workspace }}

From 1fa55d25e9a0c3c2d494179709cbe48e77f2c4c2 Mon Sep 17 00:00:00 2001
From: David Bold <dave@ipp.mpg.de>
Date: Tue, 24 Jun 2025 11:37:26 +0200
Subject: [PATCH 098/129] CI: require python3-boututils

---
 .ci_fedora.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.ci_fedora.sh b/.ci_fedora.sh
index 359516ab33..5f0a36efea 100755
--- a/.ci_fedora.sh
+++ b/.ci_fedora.sh
@@ -43,7 +43,7 @@ then
     echo "minrate=10M" >> /etc/dnf/dnf.conf
     export FORCE_COLUMNS=200
     time dnf -y install dnf5
-    time dnf5 -y install dnf5-plugins cmake python3-zoidberg python3-natsort
+    time dnf5 -y install dnf5-plugins cmake python3-zoidberg python3-natsort python3-boututils
     # Allow to override packages - see #2073
     time dnf5 copr enable -y davidsch/fixes4bout || :
     time dnf5 -y upgrade

From 81befc23a51139f22c8b2835cacebd16dfdd5457 Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Tue, 24 Jun 2025 15:24:05 +0100
Subject: [PATCH 099/129] Revert "Merge pull request #3082 from
 boutproject/next-elimBE"

This reverts commit e080493b169310f0da60811e21b463f94512d9e1, reversing
changes made to 520ba0609932639f025b13517294101705a72b77.
---
 CMakeLists.txt                                |   1 -
 include/bout/hypre_interface.hxx              | 185 +-----------------
 .../laplace/impls/hypre3d/hypre3d_laplace.cxx |   5 -
 src/sys/hypre_interface.cxx                   | 131 -------------
 tests/integrated/test-laplace-hypre3d/runtest |  14 +-
 5 files changed, 7 insertions(+), 329 deletions(-)
 delete mode 100644 src/sys/hypre_interface.cxx

diff --git a/CMakeLists.txt b/CMakeLists.txt
index af628a7db5..c45fca3b72 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -335,7 +335,6 @@ set(BOUT_SOURCES
   ./src/sys/generator_context.cxx
   ./include/bout/hyprelib.hxx
   ./src/sys/hyprelib.cxx
-  ./src/sys/hypre_interface.cxx
   ./src/sys/msg_stack.cxx
   ./src/sys/options.cxx
   ./src/sys/options/optionparser.hxx
diff --git a/include/bout/hypre_interface.hxx b/include/bout/hypre_interface.hxx
index 365dd715e6..ae392de4f3 100644
--- a/include/bout/hypre_interface.hxx
+++ b/include/bout/hypre_interface.hxx
@@ -58,110 +58,6 @@ int checkHypreError(int error) {
 // TODO: set sizes
 // TODO: set contiguous blocks at once
 
-/// Wrapper around HYPRE_Complex, that calls HypreFree when destroyed.
-struct HypreComplexArray {
-  HYPRE_Complex* data;
-
-  HypreComplexArray(int n) { HypreMalloc(data, sizeof(HYPRE_Complex) * n); }
-
-  ~HypreComplexArray() { HypreFree(data); }
-};
-
-/// Shared pointter to a HypreComplexArray. When the last copy is destroyed
-/// the HYPRE_Complex array inside will be free'd.
-using BCValuesPtr = std::shared_ptr<HypreComplexArray>;
-
-/*!
- * This function modifies the input for the HYPRE_IJMatrixSetValues() routine to
- * eliminate the boundary condition equations (see below for details on how the
- * equations are adjusted).  It modifies the arrays ncols, rows, cols, and
- * values.  It also returns a row_indexes array.  This can then be passed to the
- * HYPRE_IJMatrixSetValues2() routine to set up the matrix in hypre.
- *
- * The arguments nb and bi_array indicate the boundary equations.  The routine
- * returns info needed to adjust the right-hand-side and solution vector through
- * the functions AdjustRightHandSideEquations and AdjustSolutionEquations.
- *
- * NOTE: It may make sense from an organizational standpoint to collect many of
- * these arguments in a structure of some sort.
- *
- * Notation, assumptions, and other details:
- *
- * - Boundary equation i is assumed to have two coefficients
- *
- *      b_ii * u_i + b_ij * u_j = rhs_i
- *
- * - We also assume that each boundary equation has only one interior equation k
- *   coupled to it (such that k = j) with coupling coefficient a_ki
- *
- *      a_ki * u_i + a_kj * u_j + ... = rhs_k
- *
- * - Each equation k is adjusted as follows:
- *
- *      a_kj = a_kj - a_ki * b_ij / b_ii
- *      a_ki = 0
- *
- * - Boundary equations are adjusted to be identity equations in the matrix, but
- *   the boundary coefficients (b_ii, b_ij) are returned for use later
- *
- * - Right-hand-side equations are adjusted in AdjustRightHandSideEquations() as
- *   follows: rhs_k = rhs_k - a_ki * rhs_i / b_ii
- *
- * - Solution unknowns are adjusted at boundaries in AdjustSolutionEquations as
- *   follows: u_i = (rhs_i - b_ij * u_j) / b_ii
- *
- * - Naming conventions: Arrays starting with 'b' are boundary equation arrays
- *   indexed by 'bnum', and arrays starting with 'a' are non-boundary arrays
- *   (interior matrix equations) indexed by 'anum'.  When 'num' is prefixed with
- *   a row or column number 'i', 'j', or 'k', the array holds the corresponding
- *   local data index for that row or column (e.g., an index into the local
- *   solution vector).  Matrix coefficients are named as above, e.g., 'bij' is
- *   the coefficient for b_ij.
- *
- *   NOTE: Implementation in src/sys/hypre_interface.cxx
- */
-struct BCMatrixEquations {
-  HYPRE_Int nb;
-  HYPRE_Int* binum_array;
-  HYPRE_Int* bjnum_array;
-  HYPRE_Complex* bii_array;
-  HYPRE_Complex* bij_array;
-  HYPRE_Int na;
-  HYPRE_Int* aknum_array;
-  HYPRE_Complex* aki_array;
-
-  BCMatrixEquations() = delete;
-
-  BCMatrixEquations(HYPRE_Int nrows, HYPRE_Int* ncols, HYPRE_BigInt* rows,
-                    HYPRE_Int** row_indexes_ptr, HYPRE_BigInt* cols,
-                    HYPRE_Complex* values,
-                    HYPRE_Int nb,         // number of boundary equations
-                    HYPRE_Int* bi_array); // row i for each boundary equation
-
-  ~BCMatrixEquations() {
-    // Free arrays
-    HypreFree(binum_array);
-    HypreFree(bjnum_array);
-    HypreFree(bii_array);
-    HypreFree(bij_array);
-    HypreFree(aknum_array);
-    HypreFree(aki_array);
-  }
-
-  /// Applies in-place modification of the rhs array.
-  ///
-  /// Returns an array of boundary values that can be used to apply
-  /// boundary conditions to a solution vector.
-  BCValuesPtr adjustBCRightHandSideEquations(HYPRE_Complex* rhs);
-
-  /// Apply boundary conditions to the solution.
-  /// Uses the BCValuesPtr returned from adjustBCRightHandSideEquations()
-  void adjustBCSolutionEquations(BCValuesPtr brhs, HYPRE_Complex* solution);
-};
-
-/// A shared pointer to a BCMatrixEquations object
-using BCMatrixPtr = std::shared_ptr<BCMatrixEquations>;
-
 template <class T>
 class HypreVector {
   MPI_Comm comm;
@@ -278,14 +174,6 @@ public:
     HypreMalloc(V, vsize * sizeof(HYPRE_Complex));
   }
 
-  // Data for eliminating boundary equation
-  bool elimBErhs = false;
-  bool elimBEsol = false;
-  BCMatrixPtr bcmatrix;
-  BCValuesPtr bcvalues; /// Stores rhs values of BC rows
-
-  void syncElimBErhs(HypreVector<T>& rhs) { bcvalues = rhs.bcvalues; }
-
   void assemble() {
     CALI_CXX_MARK_FUNCTION;
     writeCacheToHypre();
@@ -295,17 +183,11 @@ public:
   }
 
   void writeCacheToHypre() {
-    if (elimBErhs) {
-      bcvalues = bcmatrix->adjustBCRightHandSideEquations(V);
-    }
     checkHypreError(HYPRE_IJVectorSetValues(hypre_vector, vsize, I, V));
   }
 
   void readCacheFromHypre() {
     checkHypreError(HYPRE_IJVectorGetValues(hypre_vector, vsize, I, V));
-    if (elimBEsol) {
-      bcmatrix->adjustBCSolutionEquations(bcvalues, V);
-    }
   }
 
   T toField() {
@@ -785,20 +667,6 @@ public:
     return Element(*this, global_row, global_column, positions, weights);
   }
 
-  // Data for eliminating boundary equations
-  bool elimBE = false;
-  BCMatrixPtr bcmatrix; // Shared pointer
-
-  void setElimBE() { elimBE = true; }
-
-  void setElimBEVectors(HypreVector<T>& sol, HypreVector<T>& rhs) {
-    sol.elimBEsol = elimBE;
-    sol.bcmatrix = bcmatrix;
-
-    rhs.elimBErhs = elimBE;
-    rhs.bcmatrix = bcmatrix;
-  }
-
   void assemble() {
     CALI_CXX_MARK_FUNCTION;
 
@@ -827,32 +695,8 @@ public:
         entry++;
       }
     }
-
-    // Eliminate boundary condition equations in hypre SetValues input arguments
-    if (elimBE) {
-      HYPRE_Int* bi_array;
-      HYPRE_Int* row_indexes;
-      // There must be an easier way to get nb
-      int nb = 0;
-      BOUT_FOR_SERIAL(i, index_converter->getRegionBndry()) { nb++; }
-      HypreMalloc(bi_array, nb * sizeof(HYPRE_Int));
-      nb = 0;
-      BOUT_FOR_SERIAL(i, index_converter->getRegionBndry()) {
-        bi_array[nb] = index_converter->getGlobal(i);
-        nb++;
-      }
-
-      bcmatrix = std::make_shared<BCMatrixEquations>(
-          num_rows, num_cols, rawI, &row_indexes, cols, vals, nb, bi_array);
-      HypreFree(bi_array);
-
-      checkHypreError(HYPRE_IJMatrixSetValues2(*hypre_matrix, num_rows, num_cols, rawI,
-                                               row_indexes, cols, vals));
-      HypreFree(row_indexes);
-    } else {
-      checkHypreError(
-          HYPRE_IJMatrixSetValues(*hypre_matrix, num_rows, num_cols, rawI, cols, vals));
-    }
+    checkHypreError(
+        HYPRE_IJMatrixSetValues(*hypre_matrix, num_rows, num_cols, rawI, cols, vals));
     checkHypreError(HYPRE_IJMatrixAssemble(*hypre_matrix));
     checkHypreError(HYPRE_IJMatrixGetObject(*hypre_matrix,
                                             reinterpret_cast<void**>(&parallel_matrix)));
@@ -1032,31 +876,6 @@ public:
     setMaxIter(
         options["maxits"].doc("Maximum iterations for Hypre solver").withDefault(10000));
 
-    switch (solver_type) {
-    case HYPRE_SOLVER_TYPE::gmres: {
-      HYPRE_ParCSRGMRESSetKDim(solver,
-                               options["kdim"]
-                                   .doc("Set the maximum size of the Krylov space")
-                                   .withDefault(30));
-
-      if (options["skip_real_residual_check"]
-              .doc("Skip the evaluation and the check of the actual residual?")
-              .withDefault<bool>(false)) {
-        HYPRE_GMRESSetSkipRealResidualCheck(solver, 1);
-      }
-      break;
-    }
-    case HYPRE_SOLVER_TYPE::bicgstab: {
-      break;
-    }
-    case HYPRE_SOLVER_TYPE::pcg: {
-      break;
-    }
-    default: {
-      throw BoutException("Unsupported hypre_solver_type {}", toString(solver_type));
-    }
-    }
-
     HYPRE_BoomerAMGCreate(&precon);
     HYPRE_BoomerAMGSetOldDefault(precon);
 #if BOUT_HAS_CUDA
diff --git a/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx b/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx
index beb83a216d..c50be1db85 100644
--- a/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx
+++ b/src/invert/laplace/impls/hypre3d/hypre3d_laplace.cxx
@@ -218,15 +218,11 @@ Field3D LaplaceHypre3d::solve(const Field3D& b_in, const Field3D& x0) {
 
   CALI_MARK_BEGIN("LaplaceHypre3d_solve:vectorAssemble");
 
-  operator3D.setElimBEVectors(solution, rhs);
-
   rhs.importValuesFromField(b);
   solution.importValuesFromField(x0);
   rhs.assemble();
   solution.assemble();
 
-  solution.syncElimBErhs(rhs);
-
   CALI_MARK_END("LaplaceHypre3d_solve:vectorAssemble");
 
   CALI_MARK_BEGIN("LaplaceHypre3d_solve:solve");
@@ -415,7 +411,6 @@ void LaplaceHypre3d::updateMatrix3D() {
     operator3D.ydown(ydown)(l, l.ym().zp()) += -C_d2f_dydz;
     operator3D.ydown(ydown)(l, l.ym().zm()) += C_d2f_dydz;
   }
-  operator3D.setElimBE();
   operator3D.assemble();
 
   if (print_matrix) {
diff --git a/src/sys/hypre_interface.cxx b/src/sys/hypre_interface.cxx
deleted file mode 100644
index 1838bd5158..0000000000
--- a/src/sys/hypre_interface.cxx
+++ /dev/null
@@ -1,131 +0,0 @@
-
-#include "bout/build_defines.hxx"
-
-#if BOUT_HAS_HYPRE
-
-#include "bout/hypre_interface.hxx"
-
-namespace bout {
-
-BCMatrixEquations::BCMatrixEquations(HYPRE_Int nrows, HYPRE_Int* ncols,
-                                     HYPRE_BigInt* rows, HYPRE_Int** row_indexes_ptr,
-                                     HYPRE_BigInt* cols, HYPRE_Complex* values,
-                                     HYPRE_Int nb, HYPRE_Int* bi_array)
-    : nb(nb) {
-  HYPRE_Int* row_indexes;
-
-  // Create the row_indexes array
-  row_indexes = (HYPRE_Int*)malloc(sizeof(HYPRE_Int) * nrows);
-  row_indexes[0] = 0;
-  for (HYPRE_Int i = 1; i < nrows; i++) {
-    row_indexes[i] = row_indexes[i - 1] + ncols[i - 1];
-  }
-
-  // Assume just one interior equation coupled to each boundary equation
-  na = nb;
-
-  // Allocate arrays
-  HypreMalloc(binum_array, sizeof(HYPRE_Int) * nb);
-  HypreMalloc(bjnum_array, sizeof(HYPRE_Int) * nb);
-  HypreMalloc(bii_array, sizeof(HYPRE_Complex) * nb);
-  HypreMalloc(bij_array, sizeof(HYPRE_Complex) * nb);
-  HypreMalloc(aknum_array, sizeof(HYPRE_Int) * na);
-  HypreMalloc(aki_array, sizeof(HYPRE_Complex) * na);
-
-  HYPRE_Int binum = 0;
-  HYPRE_Int aknum = 0;
-  for (HYPRE_Int bnum = 0; bnum < nb; bnum++) {
-    // Get boundary equation information and adjust boundary equations
-    // Find row i in rows array (assume i increases and rows is sorted)
-    HYPRE_Int i = bi_array[bnum];
-    for (; binum < nrows; binum++) {
-      if (i == rows[binum]) {
-        break; // Found row i in rows array
-      }
-    }
-    HYPRE_Int bcoeffnum = row_indexes[binum];
-    HYPRE_Complex bii{0.0}, bij{0.0};
-    HYPRE_Int j = 0;
-
-    for (HYPRE_Int m = 0; m < 2; m++) { // Assume only two boundary equation coefficients
-      if (cols[bcoeffnum + m] == i) {
-        bii = values[bcoeffnum + m];
-        values[bcoeffnum + m] = -1.0; // Identity equation (negative definite matrix)
-      } else {
-        j = cols[bcoeffnum + m];
-        bij = values[bcoeffnum + m];
-        values[bcoeffnum + m] = 0.0; // Identity equation
-      }
-    }
-    ncols[binum] = 1; // Identity equation
-
-    /* Get interior equation information and adjust interior equations */
-    /* Find row k in rows array (assume k increases and rows is sorted) */
-    HYPRE_Int k = j; // Assume equation k = j
-    for (; aknum < nrows; aknum++) {
-      if (k == rows[aknum]) {
-        break; // Found row k in rows array
-      }
-    }
-    HYPRE_Int acoeffnum = row_indexes[aknum];
-
-    HYPRE_Int mkj = 0;
-    HYPRE_Complex aki{0.0};
-    for (HYPRE_Int m = 0; m < ncols[aknum]; m++) {
-      if (cols[acoeffnum + m] == j) {
-        mkj = m; // Save for update of akj value below
-      }
-      if (cols[acoeffnum + m] == i) {
-        aki = values[acoeffnum + m];
-        values[acoeffnum + m] = 0.0; // Eliminate coupling to boundary equation
-      }
-    }
-    values[acoeffnum + mkj] -= aki * bij / bii; // Update akj value
-
-    // Update arrays
-    HYPRE_Int anum = bnum; // Assume only one interior equation k
-    binum_array[bnum] = binum;
-    bjnum_array[bnum] = aknum; // Assume only one interior equation k
-    bii_array[bnum] = bii;
-    bij_array[bnum] = bij;
-    aknum_array[anum] = aknum;
-    aki_array[anum] = aki;
-  }
-
-  // Set return arguments
-  *row_indexes_ptr = row_indexes;
-}
-
-BCValuesPtr BCMatrixEquations::adjustBCRightHandSideEquations(HYPRE_Complex* rhs) {
-
-  // Allocate array to store boundary row values
-  BCValuesPtr brhs = std::make_shared<HypreComplexArray>(nb);
-
-  for (HYPRE_Int bnum = 0; bnum < nb; bnum++) {
-    HYPRE_Int binum = binum_array[bnum];
-    brhs->data[bnum] = rhs[binum];
-  }
-
-  for (HYPRE_Int anum = 0; anum < na; anum++) {
-    HYPRE_Int bnum = anum; // Assume only one interior equation per boundary equation
-    HYPRE_Int aknum = aknum_array[anum];
-    rhs[aknum] -= aki_array[anum] * brhs->data[bnum] / bii_array[bnum];
-  }
-
-  return brhs;
-}
-
-void BCMatrixEquations::adjustBCSolutionEquations(BCValuesPtr brhs,
-                                                  HYPRE_Complex* solution) {
-
-  for (HYPRE_Int bnum = 0; bnum < nb; bnum++) {
-    HYPRE_Int binum = binum_array[bnum];
-    HYPRE_Int bjnum = bjnum_array[bnum];
-    solution[binum] =
-        (brhs->data[bnum] - bij_array[bnum] * solution[bjnum]) / bii_array[bnum];
-  }
-}
-
-} // namespace bout
-
-#endif // BOUT_HAS_HYPRE
diff --git a/tests/integrated/test-laplace-hypre3d/runtest b/tests/integrated/test-laplace-hypre3d/runtest
index 89acf79364..b50c5993b7 100755
--- a/tests/integrated/test-laplace-hypre3d/runtest
+++ b/tests/integrated/test-laplace-hypre3d/runtest
@@ -19,24 +19,20 @@ build_and_log("Laplace 3D with Hypre")
 
 success = True
 for directory, nproc in test_directories:
-    command = "./test-laplace3d -d " + directory
+    command = "test-laplace3d -d " + directory
     print("running on", nproc, "processors:", command)
-    s, out = launch_safe(command, nproc=nproc, pipe=True)
-    # Save output to log file
-    with open("run.log." + directory, "w") as f:
-        f.write(out)
+    launch_safe(command, nproc=nproc)
 
     error_max = collect("error_max", path=directory, info=False)
 
     if error_max > tolerance:
-        print(f" => {directory} failed with maximum error {error_max}")
+        print(directory + " failed with maximum error {}".format(error_max))
         success = False
     else:
-        print(f" => {directory} passed with maximum error {error_max}")
+        print(directory + " passed with maximum error {}".format(error_max))
 
 if success:
-    print("=> All passed")
+    print("All passed")
     exit(0)
 else:
-    print("=> Some tests failed")
     exit(1)

From c6ad498df7ea672aabb10665b5f30b9d64b31d0f Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Sun, 29 Jun 2025 14:26:41 -0700
Subject: [PATCH 100/129] Handle absolute paths to options file

The command line switch -f specifies the path to the BOUT.inp file.
Previously this was always concatenated with the data directory.
Paths with a leading '/' are now treated as absolute paths.

With C++17 this can be replaced by `std::filesystem` paths.
---
 src/bout++.cxx | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/src/bout++.cxx b/src/bout++.cxx
index 7f23cf5f91..39f5468f07 100644
--- a/src/bout++.cxx
+++ b/src/bout++.cxx
@@ -84,7 +84,7 @@ const char DEFAULT_DIR[] = "data";
 // Define S_ISDIR if not defined by system headers (that is, MSVC)
 // Taken from https://github.com/curl/curl/blob/e59540139a398dc70fde6aec487b19c5085105af/lib/curl_setup.h#L748-L751
 #if !defined(S_ISDIR) && defined(S_IFMT) && defined(S_IFDIR)
-#define S_ISDIR(m) (((m)&S_IFMT) == S_IFDIR)
+#define S_ISDIR(m) (((m) & S_IFMT) == S_IFDIR)
 #endif
 
 #ifdef _MSC_VER
@@ -180,7 +180,13 @@ int BoutInitialise(int& argc, char**& argv) {
     // `optionfile` here, but we'd need to call parseCommandLine
     // _first_ in order to do that and set the source, etc., but we
     // need to call that _second_ in order to override the input file
-    reader->read(Options::getRoot(), "{}/{}", args.data_dir, args.opt_file);
+    if (args.opt_file[0] == '/') {
+      // Absolute path
+      reader->read(Options::getRoot(), "{}", args.opt_file);
+    } else {
+      // Join paths. In C++17 this could be done using std::filesystem
+      reader->read(Options::getRoot(), "{}/{}", args.data_dir, args.opt_file);
+    }
 
     // Get options override from command-line
     reader->parseCommandLine(Options::getRoot(), args.argv);

From 7c2c6543d871f2e9144eb21d0cd9031eed530d3f Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Wed, 2 Jul 2025 11:04:43 +0100
Subject: [PATCH 101/129] Fix name clash in some examples and MMS tests

`FieldFactory` expects an `input` section, so this cannot be used as a
variable name in the input file
---
 examples/laplacexy/laplace_perp/square/BOUT.inp | 2 +-
 examples/laplacexy/laplace_perp/test.cxx        | 2 +-
 examples/laplacexy/laplace_perp/torus/BOUT.inp  | 2 +-
 tests/MMS/laplace/data/BOUT.inp                 | 2 +-
 tests/MMS/laplace/laplace.cxx                   | 6 ++++--
 tests/MMS/spatial/d2dx2/data/BOUT.inp           | 2 +-
 tests/MMS/spatial/d2dx2/test_d2dx2.cxx          | 2 +-
 tests/MMS/spatial/d2dz2/data/BOUT.inp           | 2 +-
 tests/MMS/spatial/d2dz2/test_d2dz2.cxx          | 2 +-
 9 files changed, 12 insertions(+), 10 deletions(-)

diff --git a/examples/laplacexy/laplace_perp/square/BOUT.inp b/examples/laplacexy/laplace_perp/square/BOUT.inp
index 95ecb7119f..38fb175d90 100644
--- a/examples/laplacexy/laplace_perp/square/BOUT.inp
+++ b/examples/laplacexy/laplace_perp/square/BOUT.inp
@@ -1,5 +1,5 @@
 
-input = sin(pi*x - y)
+input_field = sin(pi*x - y)
 
 non_uniform = true  # Include corrections to second derivatives
 
diff --git a/examples/laplacexy/laplace_perp/test.cxx b/examples/laplacexy/laplace_perp/test.cxx
index 1312b005da..8a9a99f92c 100644
--- a/examples/laplacexy/laplace_perp/test.cxx
+++ b/examples/laplacexy/laplace_perp/test.cxx
@@ -47,7 +47,7 @@ int main(int argc, char** argv) {
   ///////////////////////////////////////
 
   // Read an analytic input
-  Field2D input = FieldFactory::get()->create2D("input", Options::getRoot(), mesh);
+  Field2D input = FieldFactory::get()->create2D("input_field", Options::getRoot(), mesh);
 
   // Create a LaplaceXY solver
   LaplaceXY* laplacexy = new LaplaceXY(mesh);
diff --git a/examples/laplacexy/laplace_perp/torus/BOUT.inp b/examples/laplacexy/laplace_perp/torus/BOUT.inp
index 365294174f..4109b44bab 100644
--- a/examples/laplacexy/laplace_perp/torus/BOUT.inp
+++ b/examples/laplacexy/laplace_perp/torus/BOUT.inp
@@ -1,5 +1,5 @@
 
-input = sin(pi*x - y)
+input_field = sin(pi*x - y)
 calc_metric = true  # Read Rxy, Bpxy etc and calculate metric
 
 non_uniform = true  # Include corrections to second derivatives
diff --git a/tests/MMS/laplace/data/BOUT.inp b/tests/MMS/laplace/data/BOUT.inp
index 1965b1e8f7..5b3cc37b09 100644
--- a/tests/MMS/laplace/data/BOUT.inp
+++ b/tests/MMS/laplace/data/BOUT.inp
@@ -5,7 +5,7 @@ MXG = 1
 
 
 solution = sin(pi*x)
-input = -pi^2*sin(pi*x)
+input_field = -pi^2*sin(pi*x)
 
 [mesh]
 
diff --git a/tests/MMS/laplace/laplace.cxx b/tests/MMS/laplace/laplace.cxx
index 54dbaaba67..e81ca64fa1 100644
--- a/tests/MMS/laplace/laplace.cxx
+++ b/tests/MMS/laplace/laplace.cxx
@@ -5,6 +5,7 @@
 #include <bout/invert_laplace.hxx>
 
 using bout::globals::mesh;
+using namespace std::string_literals;
 
 int main(int argc, char** argv) {
   int init_err = BoutInitialise(argc, argv);
@@ -31,10 +32,11 @@ int main(int argc, char** argv) {
 
   FieldFactory fact(mesh);
 
-  std::shared_ptr<FieldGenerator> gen = fact.parse("input");
+  const auto input_name = "input_field"s;
+  std::shared_ptr<FieldGenerator> gen = fact.parse(input_name);
   output << "GEN = " << gen->str() << endl;
 
-  Field3D input = fact.create3D("input");
+  Field3D input = fact.create3D(input_name);
 
   Field3D result = lap->solve(input);
 
diff --git a/tests/MMS/spatial/d2dx2/data/BOUT.inp b/tests/MMS/spatial/d2dx2/data/BOUT.inp
index 5c1deaf0af..cdc0d96139 100644
--- a/tests/MMS/spatial/d2dx2/data/BOUT.inp
+++ b/tests/MMS/spatial/d2dx2/data/BOUT.inp
@@ -5,7 +5,7 @@ MXG = 1
 
 MYG = 1  # No guard cells in Y
 
-input = sin(0.5*pi*x)
+input_field = sin(0.5*pi*x)
 solution = -sin(0.5*pi*x) * 0.25*pi*pi
 
 [mesh]
diff --git a/tests/MMS/spatial/d2dx2/test_d2dx2.cxx b/tests/MMS/spatial/d2dx2/test_d2dx2.cxx
index 6b35b719e1..228dca4b2a 100644
--- a/tests/MMS/spatial/d2dx2/test_d2dx2.cxx
+++ b/tests/MMS/spatial/d2dx2/test_d2dx2.cxx
@@ -12,7 +12,7 @@ int main(int argc, char** argv) {
 
   BoutInitialise(argc, argv);
 
-  Field3D input = FieldFactory::get()->create3D("input", Options::getRoot(), mesh);
+  Field3D input = FieldFactory::get()->create3D("input_field", Options::getRoot(), mesh);
   Field3D solution = FieldFactory::get()->create3D("solution", Options::getRoot(), mesh);
   // At this point the boundary cells are set to the analytic solution
 
diff --git a/tests/MMS/spatial/d2dz2/data/BOUT.inp b/tests/MMS/spatial/d2dz2/data/BOUT.inp
index 6618d6f574..640411c112 100644
--- a/tests/MMS/spatial/d2dz2/data/BOUT.inp
+++ b/tests/MMS/spatial/d2dz2/data/BOUT.inp
@@ -5,7 +5,7 @@ zperiod = 1
 MXG = 0  # No guard cells in X
 MYG = 1  # No guard cells in Y
 
-input = sin(z)
+input_field = sin(z)
 solution = -sin(z)
 
 [mesh]
diff --git a/tests/MMS/spatial/d2dz2/test_d2dz2.cxx b/tests/MMS/spatial/d2dz2/test_d2dz2.cxx
index 0b7aa2cde4..9dccb6a992 100644
--- a/tests/MMS/spatial/d2dz2/test_d2dz2.cxx
+++ b/tests/MMS/spatial/d2dz2/test_d2dz2.cxx
@@ -12,7 +12,7 @@ int main(int argc, char** argv) {
 
   BoutInitialise(argc, argv);
 
-  Field3D input = FieldFactory::get()->create3D("input", Options::getRoot(), mesh);
+  Field3D input = FieldFactory::get()->create3D("input_field", Options::getRoot(), mesh);
   Field3D solution = FieldFactory::get()->create3D("solution", Options::getRoot(), mesh);
 
   Field3D result = D2DZ2(input);

From 824d095d101789137460559cd29ac6d7e62190f0 Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Wed, 2 Jul 2025 11:07:12 +0100
Subject: [PATCH 102/129] Fix some clang-tidy warnings

---
 examples/laplacexy/laplace_perp/test.cxx | 14 +++++++++-----
 tests/MMS/laplace/laplace.cxx            |  5 +++--
 2 files changed, 12 insertions(+), 7 deletions(-)

diff --git a/examples/laplacexy/laplace_perp/test.cxx b/examples/laplacexy/laplace_perp/test.cxx
index 8a9a99f92c..291faffabc 100644
--- a/examples/laplacexy/laplace_perp/test.cxx
+++ b/examples/laplacexy/laplace_perp/test.cxx
@@ -10,11 +10,15 @@ int main(int argc, char** argv) {
   BoutInitialise(argc, argv);
 
   ///////////////////////////////////////
-  bool calc_metric;
-  calc_metric = Options::root()["calc_metric"].withDefault(false);
+  const bool calc_metric = Options::root()["calc_metric"].withDefault(false);
   if (calc_metric) {
     // Read metric tensor
-    Field2D Rxy, Btxy, Bpxy, B0, hthe, I;
+    Field2D Rxy;
+    Field2D Btxy;
+    Field2D Bpxy;
+    Field2D B0;
+    Field2D hthe;
+    Field2D I;
     mesh->get(Rxy, "Rxy");   // m
     mesh->get(Btxy, "Btxy"); // T
     mesh->get(Bpxy, "Bpxy"); // T
@@ -50,10 +54,10 @@ int main(int argc, char** argv) {
   Field2D input = FieldFactory::get()->create2D("input_field", Options::getRoot(), mesh);
 
   // Create a LaplaceXY solver
-  LaplaceXY* laplacexy = new LaplaceXY(mesh);
+  LaplaceXY laplacexy{mesh};
 
   // Solve, using 0.0 as starting guess
-  Field2D solved = laplacexy->solve(input, 0.0);
+  Field2D solved = laplacexy.solve(input, 0.0);
 
   // Need to communicate guard cells
   mesh->communicate(solved);
diff --git a/tests/MMS/laplace/laplace.cxx b/tests/MMS/laplace/laplace.cxx
index e81ca64fa1..15fc849d8f 100644
--- a/tests/MMS/laplace/laplace.cxx
+++ b/tests/MMS/laplace/laplace.cxx
@@ -11,7 +11,8 @@ int main(int argc, char** argv) {
   int init_err = BoutInitialise(argc, argv);
   if (init_err < 0) {
     return 0;
-  } else if (init_err > 0) {
+  }
+  if (init_err > 0) {
     return init_err;
   }
 
@@ -34,7 +35,7 @@ int main(int argc, char** argv) {
 
   const auto input_name = "input_field"s;
   std::shared_ptr<FieldGenerator> gen = fact.parse(input_name);
-  output << "GEN = " << gen->str() << endl;
+  output.write("GEN = {}\n", gen->str());
 
   Field3D input = fact.create3D(input_name);
 

From 90f7b033bc117271ae5fef19eb03d4bba42545e8 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Wed, 2 Jul 2025 17:14:20 -0700
Subject: [PATCH 103/129] Use std::filesystem::path for inputs

C++17 feature. Should enable more robust handling of system paths.
---
 include/bout/bout.hxx | 10 ++++++----
 src/bout++.cxx        | 10 ++--------
 2 files changed, 8 insertions(+), 12 deletions(-)

diff --git a/include/bout/bout.hxx b/include/bout/bout.hxx
index 8588fe56d9..a08696ec66 100644
--- a/include/bout/bout.hxx
+++ b/include/bout/bout.hxx
@@ -34,6 +34,8 @@
 #ifndef BOUT_H
 #define BOUT_H
 
+#include <filesystem> // std::filesystem (C++17)
+
 // IWYU pragma: begin_keep, begin_export
 #include "bout/build_defines.hxx"
 
@@ -106,10 +108,10 @@ void setupGetText();
 struct CommandLineArgs {
   int verbosity{4};
   bool color_output{false};
-  std::string data_dir{"data"};          ///< Directory for data input/output
-  std::string opt_file{"BOUT.inp"};      ///< Filename for the options file
-  std::string set_file{"BOUT.settings"}; ///< Filename for the options file
-  std::string log_file{"BOUT.log"};      ///< File name for the log file
+  std::filesystem::path data_dir{"data"};          ///< Directory for data input/output
+  std::filesystem::path opt_file{"BOUT.inp"};      ///< Filename for the options file
+  std::filesystem::path set_file{"BOUT.settings"}; ///< Filename for the options file
+  std::filesystem::path log_file{"BOUT.log"};      ///< File name for the log file
   /// The original set of command line arguments
   std::vector<std::string> original_argv;
   /// The "canonicalised" command line arguments, with single-letter
diff --git a/src/bout++.cxx b/src/bout++.cxx
index 39f5468f07..6de1c5713b 100644
--- a/src/bout++.cxx
+++ b/src/bout++.cxx
@@ -4,7 +4,7 @@
  * Adapted from the BOUT code by B.Dudson, University of York, Oct 2007
  *
  **************************************************************************
- * Copyright 2010-2023 BOUT++ contributors
+ * Copyright 2010-2025 BOUT++ contributors
  *
  * Contact Ben Dudson, dudson2@llnl.gov
  *
@@ -180,13 +180,7 @@ int BoutInitialise(int& argc, char**& argv) {
     // `optionfile` here, but we'd need to call parseCommandLine
     // _first_ in order to do that and set the source, etc., but we
     // need to call that _second_ in order to override the input file
-    if (args.opt_file[0] == '/') {
-      // Absolute path
-      reader->read(Options::getRoot(), "{}", args.opt_file);
-    } else {
-      // Join paths. In C++17 this could be done using std::filesystem
-      reader->read(Options::getRoot(), "{}/{}", args.data_dir, args.opt_file);
-    }
+    reader->read(Options::getRoot(), "{}", (args.data_dir / args.opt_file).string());
 
     // Get options override from command-line
     reader->parseCommandLine(Options::getRoot(), args.argv);

From 5f0720a5b7831568089118c9bba75ee20006a2c6 Mon Sep 17 00:00:00 2001
From: malamast <malamas.tsagkaridis@gmail.com>
Date: Wed, 2 Jul 2025 18:15:03 -0700
Subject: [PATCH 104/129] SNES solver: Added a PID controller to update the
 timestep of the backward euler SNES solver.

The user sets target_its, the desired number of nonlinear iterations, and the timestep is updated based on the ratio of that number to the actual number of nonlinear iterations taken in each Newton step. The exponent can be tuned to the needs of the problem. A smaller exponent results in smaller changes of dt.
---
 src/solver/impls/snes/snes.cxx | 144 +++++++++++++++++++++++++--------
 src/solver/impls/snes/snes.hxx |  14 ++++
 2 files changed, 125 insertions(+), 33 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 15099f9e2a..8b0b09fea2 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -118,6 +118,9 @@ SNESSolver::SNESSolver(Options* opts)
       maxits((*options)["max_nonlinear_iterations"]
                  .doc("Maximum number of nonlinear iterations per SNES solve")
                  .withDefault(50)),
+      maxf((*options)["maxf"]
+                 .doc("Maximum number of function evaluations per SNES solve")
+                 .withDefault(10000)),                 
       lower_its((*options)["lower_its"]
                     .doc("Iterations below which the next timestep is increased")
                     .withDefault(static_cast<int>(maxits * 0.5))),
@@ -133,6 +136,17 @@ SNESSolver::SNESSolver(Options* opts)
       timestep_factor_on_lower_its((*options)["timestep_factor_on_lower_its"]
                                    .doc("Multiply timestep if iterations are below lower_its")
                                    .withDefault(1.4)),
+      pidController(
+          (*options)["pidController"].doc("Use PID controller?").withDefault(false)),
+      target_its((*options)["target_its"]
+                    .doc("Target snes iterations")
+                    .withDefault(static_cast<int>(7))),
+      kP((*options)["kP"].doc("Proportional PID parameter")
+                         .withDefault(0.7)),
+      kI((*options)["kI"].doc("Integral PID parameter")
+                         .withDefault(0.3)),
+      kD((*options)["kD"].doc("Derivative PID parameter")
+                         .withDefault(0.2)),   
       diagnose(
           (*options)["diagnose"].doc("Print additional diagnostics").withDefault(false)),
       diagnose_failures((*options)["diagnose_failures"]
@@ -632,14 +646,21 @@ int SNESSolver::init() {
     // Note: If the 'Amat' Jacobian is matrix free, SNESComputeJacobian
     //       always updates its reference 'u' vector every nonlinear iteration
     SNESSetLagJacobian(snes, lag_jacobian);
-    // Set Jacobian and preconditioner to persist across time steps
-    SNESSetLagJacobianPersists(snes, PETSC_TRUE);
-    SNESSetLagPreconditionerPersists(snes, PETSC_TRUE);
+    if (pidController){
+      nl_its_prev = target_its;
+      nl_its_prev2 = target_its;
+      SNESSetLagJacobianPersists(snes, PETSC_FALSE);
+      SNESSetLagPreconditionerPersists(snes, PETSC_FALSE);
+    } else {
+      // Set Jacobian and preconditioner to persist across time steps
+      SNESSetLagJacobianPersists(snes, PETSC_TRUE);
+      SNESSetLagPreconditionerPersists(snes, PETSC_TRUE);
+    }
     SNESSetLagPreconditioner(snes, 1); // Rebuild when Jacobian is rebuilt
   }
 
   // Set tolerances
-  SNESSetTolerances(snes, atol, rtol, stol, maxits, PETSC_DEFAULT);
+  SNESSetTolerances(snes, atol, rtol, stol, maxits, maxf);
 
   // Force SNES to take at least one nonlinear iteration.
   // This may prevent the solver from getting stuck in false steady state conditions
@@ -843,6 +864,11 @@ int SNESSolver::run() {
         VecAXPBY(snes_x, -beta, (1. + beta), x1);
       }
 
+
+      if (pidController){
+        SNESSetLagJacobian(snes, lag_jacobian);
+      }
+
       // Run the solver
       PetscErrorCode ierr = SNESSolve(snes, nullptr, snes_x);
 
@@ -900,6 +926,7 @@ int SNESSolver::run() {
           updateColoring();
           jacobian_pruned = false; // Reset flag. Will be set after pruning.
         }
+
         if (saved_jacobian_lag == 0) {
           // This triggers a Jacobian recalculation
           SNESGetLagJacobian(snes, &saved_jacobian_lag);
@@ -1033,45 +1060,67 @@ int SNESSolver::run() {
 #endif // PETSC_VERSION_GE(3,20,0)
 
       if (looping) {
-        // Consider changing the timestep.
-        // Note: The preconditioner depends on the timestep,
-        // so if it is not recalculated the it will be less
-        // effective.
-        if ((nl_its <= lower_its) && (timestep < max_timestep)
-            && (steps_since_snes_failure > 2)) {
-          // Increase timestep slightly
-          timestep *= timestep_factor_on_lower_its;
-
-          if (timestep > max_timestep) {
-            timestep = max_timestep;
+
+        if (pidController){
+          // Changing the timestep.
+          // Note: The preconditioner depends on the timestep,
+          // so we recalculate the jacobian and the preconditioner
+          //  every time the timestep changes
+
+          timestep = pid(timestep, nl_its);
+
+          // NOTE(malamast): Do we really need this?
+          // Recompute Jacobian (for now)
+          if (saved_jacobian_lag == 0) {
+            SNESGetLagJacobian(snes, &saved_jacobian_lag);
+            SNESSetLagJacobian(snes, 1);
           }
 
-          // Note: Setting the SNESJacobianFn to NULL retains
-          // previously set evaluation function.
-          //
-          // The SNES Jacobian is a combination of the RHS Jacobian
-          // and a factor involving the timestep.
-          // Depends on equation_form
-          // -> Probably call SNESSetJacobian(snes, Jfd, Jfd, NULL, fdcoloring);
 
-          if (static_cast<BoutReal>(lin_its) / nl_its > 4) {
-            // Recompute Jacobian (for now)
+        } else {
+          
+          // Consider changing the timestep.
+          // Note: The preconditioner depends on the timestep,
+          // so if it is not recalculated the it will be less
+          // effective.
+          if ((nl_its <= lower_its) && (timestep < max_timestep)
+              && (steps_since_snes_failure > 2)) {
+            // Increase timestep slightly
+            timestep *= timestep_factor_on_lower_its;
+
+            if (timestep > max_timestep) {
+              timestep = max_timestep;
+            }
+
+            // Note: Setting the SNESJacobianFn to NULL retains
+            // previously set evaluation function.
+            //
+            // The SNES Jacobian is a combination of the RHS Jacobian
+            // and a factor involving the timestep.
+            // Depends on equation_form
+            // -> Probably call SNESSetJacobian(snes, Jfd, Jfd, NULL, fdcoloring);
+
+            if (static_cast<BoutReal>(lin_its) / nl_its > 4) {
+              // Recompute Jacobian (for now)
+              if (saved_jacobian_lag == 0) {
+                SNESGetLagJacobian(snes, &saved_jacobian_lag);
+                SNESSetLagJacobian(snes, 1);
+              }
+            }
+
+          } else if (nl_its >= upper_its) {
+            // Reduce timestep slightly
+            timestep *= timestep_factor_on_upper_its;
+
+            // Recompute Jacobian
             if (saved_jacobian_lag == 0) {
               SNESGetLagJacobian(snes, &saved_jacobian_lag);
               SNESSetLagJacobian(snes, 1);
             }
           }
 
-        } else if (nl_its >= upper_its) {
-          // Reduce timestep slightly
-          timestep *= timestep_factor_on_upper_its;
-
-          // Recompute Jacobian
-          if (saved_jacobian_lag == 0) {
-            SNESGetLagJacobian(snes, &saved_jacobian_lag);
-            SNESSetLagJacobian(snes, 1);
-          }
         }
+
       }
       snes_failures = 0;
     } while (looping);
@@ -1386,4 +1435,33 @@ void SNESSolver::updateColoring() {
   }
 }
 
+
+BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
+
+  /* ---------- multiplicative PID factors ---------- */
+  BoutReal facP = std::pow(double(target_its) / double(nl_its),  kP);
+  BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
+  BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev)  / double(nl_its) / double(nl_its_prev2),  kD);
+
+  // clamp groth factor to avoid huge changes
+  BoutReal fac = facP * facI * facD;
+  if (fac < 0.2)
+    fac = 0.2;
+  else if (fac > 5.0)
+    fac = 5.0;
+
+  /* ---------- update timestep and history ---------- */
+  BoutReal dt_new = timestep * fac;
+
+  if (dt_new > max_timestep) {
+    dt_new = max_timestep;
+  }
+
+  nl_its_prev2 = nl_its_prev;
+  nl_its_prev  = static_cast<int>(nl_its);
+
+  return dt_new;
+}
+
+
 #endif // BOUT_HAS_PETSC
diff --git a/src/solver/impls/snes/snes.hxx b/src/solver/impls/snes/snes.hxx
index cba2352582..02e2368d71 100644
--- a/src/solver/impls/snes/snes.hxx
+++ b/src/solver/impls/snes/snes.hxx
@@ -98,6 +98,7 @@ private:
   BoutReal atol; ///< Absolute tolerance
   BoutReal rtol; ///< Relative tolerance
   BoutReal stol; ///< Convergence tolerance
+  int maxf;                 ///< Maximum number of function evaluations allowed in the solver (default: 10000)
 
   int maxits;               ///< Maximum nonlinear iterations
   int lower_its, upper_its; ///< Limits on iterations for timestep adjustment
@@ -106,6 +107,19 @@ private:
   BoutReal timestep_factor_on_upper_its;
   BoutReal timestep_factor_on_lower_its;
 
+  ///< PID controller parameters
+  bool pidController;  ///< Use PID controller?
+  int target_its;  ///< Target number of nonlinear iterations for the PID controller.
+  ///< Use with caution! Not tested values. 
+  BoutReal kP; ///< (0.6 - 0.8) Proportional parameter (main response to current step)
+  BoutReal kI; ///< (0.2 - 0.4) Integral parameter (smooths history of changes)
+  BoutReal kD; ///< (0.1 - 0.3) Derivative (dampens oscillation - optional) 
+
+  int nl_its_prev;
+  int nl_its_prev2;
+
+  BoutReal pid(BoutReal timestep, int nl_its); ///< Updates the timestep
+
   bool diagnose;          ///< Output additional diagnostics
   bool diagnose_failures; ///< Print diagnostics on SNES failures
 

From 656dbdcf6120810c5abc3e24a7e6ba507e398c12 Mon Sep 17 00:00:00 2001
From: malamast <42969991+malamast@users.noreply.github.com>
Date: Thu, 3 Jul 2025 02:28:18 +0000
Subject: [PATCH 105/129] Apply clang-format changes

---
 src/solver/impls/snes/snes.cxx | 57 ++++++++++++++++------------------
 src/solver/impls/snes/snes.hxx | 10 +++---
 2 files changed, 31 insertions(+), 36 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 8b0b09fea2..8b763acf13 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -119,8 +119,8 @@ SNESSolver::SNESSolver(Options* opts)
                  .doc("Maximum number of nonlinear iterations per SNES solve")
                  .withDefault(50)),
       maxf((*options)["maxf"]
-                 .doc("Maximum number of function evaluations per SNES solve")
-                 .withDefault(10000)),                 
+               .doc("Maximum number of function evaluations per SNES solve")
+               .withDefault(10000)),
       lower_its((*options)["lower_its"]
                     .doc("Iterations below which the next timestep is increased")
                     .withDefault(static_cast<int>(maxits * 0.5))),
@@ -128,25 +128,24 @@ SNESSolver::SNESSolver(Options* opts)
                     .doc("Iterations above which the next timestep is reduced")
                     .withDefault(static_cast<int>(maxits * 0.8))),
       timestep_factor_on_failure((*options)["timestep_factor_on_failure"]
-                                 .doc("Multiply timestep on convergence failure")
-                                 .withDefault(0.5)),
-      timestep_factor_on_upper_its((*options)["timestep_factor_on_upper_its"]
-                                   .doc("Multiply timestep if iterations exceed upper_its")
-                                   .withDefault(0.9)),
-      timestep_factor_on_lower_its((*options)["timestep_factor_on_lower_its"]
-                                   .doc("Multiply timestep if iterations are below lower_its")
-                                   .withDefault(1.4)),
+                                     .doc("Multiply timestep on convergence failure")
+                                     .withDefault(0.5)),
+      timestep_factor_on_upper_its(
+          (*options)["timestep_factor_on_upper_its"]
+              .doc("Multiply timestep if iterations exceed upper_its")
+              .withDefault(0.9)),
+      timestep_factor_on_lower_its(
+          (*options)["timestep_factor_on_lower_its"]
+              .doc("Multiply timestep if iterations are below lower_its")
+              .withDefault(1.4)),
       pidController(
           (*options)["pidController"].doc("Use PID controller?").withDefault(false)),
       target_its((*options)["target_its"]
-                    .doc("Target snes iterations")
-                    .withDefault(static_cast<int>(7))),
-      kP((*options)["kP"].doc("Proportional PID parameter")
-                         .withDefault(0.7)),
-      kI((*options)["kI"].doc("Integral PID parameter")
-                         .withDefault(0.3)),
-      kD((*options)["kD"].doc("Derivative PID parameter")
-                         .withDefault(0.2)),   
+                     .doc("Target snes iterations")
+                     .withDefault(static_cast<int>(7))),
+      kP((*options)["kP"].doc("Proportional PID parameter").withDefault(0.7)),
+      kI((*options)["kI"].doc("Integral PID parameter").withDefault(0.3)),
+      kD((*options)["kD"].doc("Derivative PID parameter").withDefault(0.2)),
       diagnose(
           (*options)["diagnose"].doc("Print additional diagnostics").withDefault(false)),
       diagnose_failures((*options)["diagnose_failures"]
@@ -646,7 +645,7 @@ int SNESSolver::init() {
     // Note: If the 'Amat' Jacobian is matrix free, SNESComputeJacobian
     //       always updates its reference 'u' vector every nonlinear iteration
     SNESSetLagJacobian(snes, lag_jacobian);
-    if (pidController){
+    if (pidController) {
       nl_its_prev = target_its;
       nl_its_prev2 = target_its;
       SNESSetLagJacobianPersists(snes, PETSC_FALSE);
@@ -864,8 +863,7 @@ int SNESSolver::run() {
         VecAXPBY(snes_x, -beta, (1. + beta), x1);
       }
 
-
-      if (pidController){
+      if (pidController) {
         SNESSetLagJacobian(snes, lag_jacobian);
       }
 
@@ -1061,7 +1059,7 @@ int SNESSolver::run() {
 
       if (looping) {
 
-        if (pidController){
+        if (pidController) {
           // Changing the timestep.
           // Note: The preconditioner depends on the timestep,
           // so we recalculate the jacobian and the preconditioner
@@ -1076,9 +1074,8 @@ int SNESSolver::run() {
             SNESSetLagJacobian(snes, 1);
           }
 
-
         } else {
-          
+
           // Consider changing the timestep.
           // Note: The preconditioner depends on the timestep,
           // so if it is not recalculated the it will be less
@@ -1118,9 +1115,7 @@ int SNESSolver::run() {
               SNESSetLagJacobian(snes, 1);
             }
           }
-
         }
-
       }
       snes_failures = 0;
     } while (looping);
@@ -1435,13 +1430,14 @@ void SNESSolver::updateColoring() {
   }
 }
 
-
 BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
 
   /* ---------- multiplicative PID factors ---------- */
-  BoutReal facP = std::pow(double(target_its) / double(nl_its),  kP);
+  BoutReal facP = std::pow(double(target_its) / double(nl_its), kP);
   BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
-  BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev)  / double(nl_its) / double(nl_its_prev2),  kD);
+  BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev) / double(nl_its)
+                               / double(nl_its_prev2),
+                           kD);
 
   // clamp groth factor to avoid huge changes
   BoutReal fac = facP * facI * facD;
@@ -1458,10 +1454,9 @@ BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
   }
 
   nl_its_prev2 = nl_its_prev;
-  nl_its_prev  = static_cast<int>(nl_its);
+  nl_its_prev = static_cast<int>(nl_its);
 
   return dt_new;
 }
 
-
 #endif // BOUT_HAS_PETSC
diff --git a/src/solver/impls/snes/snes.hxx b/src/solver/impls/snes/snes.hxx
index 02e2368d71..8a0b5bcecb 100644
--- a/src/solver/impls/snes/snes.hxx
+++ b/src/solver/impls/snes/snes.hxx
@@ -98,7 +98,7 @@ private:
   BoutReal atol; ///< Absolute tolerance
   BoutReal rtol; ///< Relative tolerance
   BoutReal stol; ///< Convergence tolerance
-  int maxf;                 ///< Maximum number of function evaluations allowed in the solver (default: 10000)
+  int maxf; ///< Maximum number of function evaluations allowed in the solver (default: 10000)
 
   int maxits;               ///< Maximum nonlinear iterations
   int lower_its, upper_its; ///< Limits on iterations for timestep adjustment
@@ -108,12 +108,12 @@ private:
   BoutReal timestep_factor_on_lower_its;
 
   ///< PID controller parameters
-  bool pidController;  ///< Use PID controller?
-  int target_its;  ///< Target number of nonlinear iterations for the PID controller.
-  ///< Use with caution! Not tested values. 
+  bool pidController; ///< Use PID controller?
+  int target_its;     ///< Target number of nonlinear iterations for the PID controller.
+  ///< Use with caution! Not tested values.
   BoutReal kP; ///< (0.6 - 0.8) Proportional parameter (main response to current step)
   BoutReal kI; ///< (0.2 - 0.4) Integral parameter (smooths history of changes)
-  BoutReal kD; ///< (0.1 - 0.3) Derivative (dampens oscillation - optional) 
+  BoutReal kD; ///< (0.1 - 0.3) Derivative (dampens oscillation - optional)
 
   int nl_its_prev;
   int nl_its_prev2;

From 5a240c85eb6fa8bc22b0351342a50e7205517d4d Mon Sep 17 00:00:00 2001
From: Malamas Tsagkaridis <42969991+malamast@users.noreply.github.com>
Date: Mon, 7 Jul 2025 13:10:51 -0700
Subject: [PATCH 106/129] Update src/solver/impls/snes/snes.cxx

Code changes suggested by ZedThree

Co-authored-by: Peter Hill <peter.hill@york.ac.uk>
---
 src/solver/impls/snes/snes.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 8b763acf13..678713f445 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -142,7 +142,7 @@ SNESSolver::SNESSolver(Options* opts)
           (*options)["pidController"].doc("Use PID controller?").withDefault(false)),
       target_its((*options)["target_its"]
                      .doc("Target snes iterations")
-                     .withDefault(static_cast<int>(7))),
+                     .withDefault(7)),
       kP((*options)["kP"].doc("Proportional PID parameter").withDefault(0.7)),
       kI((*options)["kI"].doc("Integral PID parameter").withDefault(0.3)),
       kD((*options)["kD"].doc("Derivative PID parameter").withDefault(0.2)),

From 9276da0e3fa50b7a9f613dabf011b018fa16004e Mon Sep 17 00:00:00 2001
From: malamast <42969991+malamast@users.noreply.github.com>
Date: Mon, 7 Jul 2025 20:12:06 +0000
Subject: [PATCH 107/129] Apply clang-format changes

---
 src/bout++.cxx                 | 2 +-
 src/solver/impls/snes/snes.cxx | 4 +---
 2 files changed, 2 insertions(+), 4 deletions(-)

diff --git a/src/bout++.cxx b/src/bout++.cxx
index 7f23cf5f91..4e9e37fe8d 100644
--- a/src/bout++.cxx
+++ b/src/bout++.cxx
@@ -84,7 +84,7 @@ const char DEFAULT_DIR[] = "data";
 // Define S_ISDIR if not defined by system headers (that is, MSVC)
 // Taken from https://github.com/curl/curl/blob/e59540139a398dc70fde6aec487b19c5085105af/lib/curl_setup.h#L748-L751
 #if !defined(S_ISDIR) && defined(S_IFMT) && defined(S_IFDIR)
-#define S_ISDIR(m) (((m)&S_IFMT) == S_IFDIR)
+#define S_ISDIR(m) (((m) & S_IFMT) == S_IFDIR)
 #endif
 
 #ifdef _MSC_VER
diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 678713f445..9906274a6e 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -140,9 +140,7 @@ SNESSolver::SNESSolver(Options* opts)
               .withDefault(1.4)),
       pidController(
           (*options)["pidController"].doc("Use PID controller?").withDefault(false)),
-      target_its((*options)["target_its"]
-                     .doc("Target snes iterations")
-                     .withDefault(7)),
+      target_its((*options)["target_its"].doc("Target snes iterations").withDefault(7)),
       kP((*options)["kP"].doc("Proportional PID parameter").withDefault(0.7)),
       kI((*options)["kI"].doc("Integral PID parameter").withDefault(0.3)),
       kD((*options)["kD"].doc("Derivative PID parameter").withDefault(0.2)),

From 210a6bc51499aaf39a01ee46ce4408b5909692da Mon Sep 17 00:00:00 2001
From: Malamas Tsagkaridis <42969991+malamast@users.noreply.github.com>
Date: Tue, 8 Jul 2025 11:34:07 -0700
Subject: [PATCH 108/129] Update src/solver/impls/snes/snes.cxx

Co-authored-by: Peter Hill <peter.hill@york.ac.uk>
---
 src/solver/impls/snes/snes.cxx | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 9906274a6e..387c908cb8 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1431,9 +1431,9 @@ void SNESSolver::updateColoring() {
 BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
 
   /* ---------- multiplicative PID factors ---------- */
-  BoutReal facP = std::pow(double(target_its) / double(nl_its), kP);
-  BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
-  BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev) / double(nl_its)
+  const BoutReal facP = std::pow(double(target_its) / double(nl_its), kP);
+  const BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
+  const BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev) / double(nl_its)
                                / double(nl_its_prev2),
                            kD);
 

From e881832ad7d0d5447886b0787af8ab179d9c833d Mon Sep 17 00:00:00 2001
From: Malamas Tsagkaridis <42969991+malamast@users.noreply.github.com>
Date: Tue, 8 Jul 2025 11:34:26 -0700
Subject: [PATCH 109/129] Update src/solver/impls/snes/snes.cxx

Co-authored-by: Peter Hill <peter.hill@york.ac.uk>
---
 src/solver/impls/snes/snes.cxx | 8 ++------
 1 file changed, 2 insertions(+), 6 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 387c908cb8..a0f9c06801 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1437,12 +1437,8 @@ BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
                                / double(nl_its_prev2),
                            kD);
 
-  // clamp groth factor to avoid huge changes
-  BoutReal fac = facP * facI * facD;
-  if (fac < 0.2)
-    fac = 0.2;
-  else if (fac > 5.0)
-    fac = 5.0;
+  // clamp growth factor to avoid huge changes
+  const BoutReal fac = std::clamp(facP * facI * facD, 0.2, 5.0);
 
   /* ---------- update timestep and history ---------- */
   BoutReal dt_new = timestep * fac;

From 133980416d2b266e15a718b3ef045b7b355a37e4 Mon Sep 17 00:00:00 2001
From: Malamas Tsagkaridis <42969991+malamast@users.noreply.github.com>
Date: Tue, 8 Jul 2025 11:34:37 -0700
Subject: [PATCH 110/129] Update src/solver/impls/snes/snes.cxx

Co-authored-by: Peter Hill <peter.hill@york.ac.uk>
---
 src/solver/impls/snes/snes.cxx | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index a0f9c06801..9d9a396c3c 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1441,11 +1441,7 @@ BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
   const BoutReal fac = std::clamp(facP * facI * facD, 0.2, 5.0);
 
   /* ---------- update timestep and history ---------- */
-  BoutReal dt_new = timestep * fac;
-
-  if (dt_new > max_timestep) {
-    dt_new = max_timestep;
-  }
+  const BoutReal dt_new = std::min(timestep * fac, max_timestep);
 
   nl_its_prev2 = nl_its_prev;
   nl_its_prev = static_cast<int>(nl_its);

From 687d21c5da8e40c68ff5d7306ae769a058ce9038 Mon Sep 17 00:00:00 2001
From: Malamas Tsagkaridis <42969991+malamast@users.noreply.github.com>
Date: Tue, 8 Jul 2025 11:34:47 -0700
Subject: [PATCH 111/129] Update src/solver/impls/snes/snes.cxx

Co-authored-by: Peter Hill <peter.hill@york.ac.uk>
---
 src/solver/impls/snes/snes.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 9d9a396c3c..89910f1655 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1444,7 +1444,7 @@ BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
   const BoutReal dt_new = std::min(timestep * fac, max_timestep);
 
   nl_its_prev2 = nl_its_prev;
-  nl_its_prev = static_cast<int>(nl_its);
+  nl_its_prev = nl_its;
 
   return dt_new;
 }

From 0c8ef879a944b2d58fdbdc04ac74f69f2c37c33f Mon Sep 17 00:00:00 2001
From: Malamas Tsagkaridis <42969991+malamast@users.noreply.github.com>
Date: Tue, 8 Jul 2025 11:34:57 -0700
Subject: [PATCH 112/129] Update src/solver/impls/snes/snes.cxx

Co-authored-by: Peter Hill <peter.hill@york.ac.uk>
---
 src/solver/impls/snes/snes.cxx | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 89910f1655..0b61320f34 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1083,9 +1083,7 @@ int SNESSolver::run() {
             // Increase timestep slightly
             timestep *= timestep_factor_on_lower_its;
 
-            if (timestep > max_timestep) {
-              timestep = max_timestep;
-            }
+            timestep = std::min(timestep, max_timestep);
 
             // Note: Setting the SNESJacobianFn to NULL retains
             // previously set evaluation function.

From fd6f18943cf2d715a507ce50cb7ff702a21b6196 Mon Sep 17 00:00:00 2001
From: malamast <42969991+malamast@users.noreply.github.com>
Date: Tue, 8 Jul 2025 18:36:20 +0000
Subject: [PATCH 113/129] Apply clang-format changes

---
 src/solver/impls/snes/snes.cxx | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 0b61320f34..e14d3d4569 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -1431,9 +1431,9 @@ BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
   /* ---------- multiplicative PID factors ---------- */
   const BoutReal facP = std::pow(double(target_its) / double(nl_its), kP);
   const BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
-  const BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev) / double(nl_its)
-                               / double(nl_its_prev2),
-                           kD);
+  const BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev)
+                                     / double(nl_its) / double(nl_its_prev2),
+                                 kD);
 
   // clamp growth factor to avoid huge changes
   const BoutReal fac = std::clamp(facP * facI * facD, 0.2, 5.0);

From 8619876339753cc0c5f8c1b4810adb274a57fc26 Mon Sep 17 00:00:00 2001
From: malamast <malamas.tsagkaridis@gmail.com>
Date: Thu, 17 Jul 2025 09:56:23 -0700
Subject: [PATCH 114/129] snes: I added some changes made on my remote branch
 by clang-tidy. I added the line
 MatSetOption(Jfd,MAT_KEEP_NONZERO_PATTERN,PETSC_TRUE); after the creation of
 Jfd to tell petsc to keep the pattern of the non zero elements in memory.
 Also, I changed the default coloring type to greedy which is more suited for
 large parallel problems.

---
 src/solver/impls/snes/snes.cxx | 82 +++++++++++++++++++++-------------
 1 file changed, 51 insertions(+), 31 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index e14d3d4569..4f6c11fb42 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -119,8 +119,8 @@ SNESSolver::SNESSolver(Options* opts)
                  .doc("Maximum number of nonlinear iterations per SNES solve")
                  .withDefault(50)),
       maxf((*options)["maxf"]
-               .doc("Maximum number of function evaluations per SNES solve")
-               .withDefault(10000)),
+                 .doc("Maximum number of function evaluations per SNES solve")
+                 .withDefault(10000)),                 
       lower_its((*options)["lower_its"]
                     .doc("Iterations below which the next timestep is increased")
                     .withDefault(static_cast<int>(maxits * 0.5))),
@@ -128,22 +128,25 @@ SNESSolver::SNESSolver(Options* opts)
                     .doc("Iterations above which the next timestep is reduced")
                     .withDefault(static_cast<int>(maxits * 0.8))),
       timestep_factor_on_failure((*options)["timestep_factor_on_failure"]
-                                     .doc("Multiply timestep on convergence failure")
-                                     .withDefault(0.5)),
-      timestep_factor_on_upper_its(
-          (*options)["timestep_factor_on_upper_its"]
-              .doc("Multiply timestep if iterations exceed upper_its")
-              .withDefault(0.9)),
-      timestep_factor_on_lower_its(
-          (*options)["timestep_factor_on_lower_its"]
-              .doc("Multiply timestep if iterations are below lower_its")
-              .withDefault(1.4)),
+                                 .doc("Multiply timestep on convergence failure")
+                                 .withDefault(0.5)),
+      timestep_factor_on_upper_its((*options)["timestep_factor_on_upper_its"]
+                                   .doc("Multiply timestep if iterations exceed upper_its")
+                                   .withDefault(0.9)),
+      timestep_factor_on_lower_its((*options)["timestep_factor_on_lower_its"]
+                                   .doc("Multiply timestep if iterations are below lower_its")
+                                   .withDefault(1.4)),
       pidController(
           (*options)["pidController"].doc("Use PID controller?").withDefault(false)),
-      target_its((*options)["target_its"].doc("Target snes iterations").withDefault(7)),
-      kP((*options)["kP"].doc("Proportional PID parameter").withDefault(0.7)),
-      kI((*options)["kI"].doc("Integral PID parameter").withDefault(0.3)),
-      kD((*options)["kD"].doc("Derivative PID parameter").withDefault(0.2)),
+      target_its((*options)["target_its"]
+                    .doc("Target snes iterations")
+                    .withDefault(static_cast<int>(7))),
+      kP((*options)["kP"].doc("Proportional PID parameter")
+                         .withDefault(0.7)),
+      kI((*options)["kI"].doc("Integral PID parameter")
+                         .withDefault(0.3)),
+      kD((*options)["kD"].doc("Derivative PID parameter")
+                         .withDefault(0.2)),   
       diagnose(
           (*options)["diagnose"].doc("Print additional diagnostics").withDefault(false)),
       diagnose_failures((*options)["diagnose_failures"]
@@ -351,6 +354,7 @@ int SNESSolver::init() {
 
       // Set size of Matrix on each processor to nlocal x nlocal
       MatCreate(BoutComm::get(), &Jfd);
+      MatSetOption(Jfd,MAT_KEEP_NONZERO_PATTERN,PETSC_TRUE);
       MatSetSizes(Jfd, nlocal, nlocal, PETSC_DETERMINE, PETSC_DETERMINE);
       MatSetFromOptions(Jfd);
       // Determine which row/columns of the matrix are locally owned
@@ -643,7 +647,7 @@ int SNESSolver::init() {
     // Note: If the 'Amat' Jacobian is matrix free, SNESComputeJacobian
     //       always updates its reference 'u' vector every nonlinear iteration
     SNESSetLagJacobian(snes, lag_jacobian);
-    if (pidController) {
+    if (pidController){
       nl_its_prev = target_its;
       nl_its_prev2 = target_its;
       SNESSetLagJacobianPersists(snes, PETSC_FALSE);
@@ -861,7 +865,8 @@ int SNESSolver::run() {
         VecAXPBY(snes_x, -beta, (1. + beta), x1);
       }
 
-      if (pidController) {
+
+      if (pidController){
         SNESSetLagJacobian(snes, lag_jacobian);
       }
 
@@ -1057,7 +1062,7 @@ int SNESSolver::run() {
 
       if (looping) {
 
-        if (pidController) {
+        if (pidController){
           // Changing the timestep.
           // Note: The preconditioner depends on the timestep,
           // so we recalculate the jacobian and the preconditioner
@@ -1072,8 +1077,9 @@ int SNESSolver::run() {
             SNESSetLagJacobian(snes, 1);
           }
 
-        } else {
 
+        } else {
+          
           // Consider changing the timestep.
           // Note: The preconditioner depends on the timestep,
           // so if it is not recalculated the it will be less
@@ -1083,7 +1089,9 @@ int SNESSolver::run() {
             // Increase timestep slightly
             timestep *= timestep_factor_on_lower_its;
 
-            timestep = std::min(timestep, max_timestep);
+            if (timestep > max_timestep) {
+              timestep = max_timestep;
+            }
 
             // Note: Setting the SNESJacobianFn to NULL retains
             // previously set evaluation function.
@@ -1111,7 +1119,9 @@ int SNESSolver::run() {
               SNESSetLagJacobian(snes, 1);
             }
           }
+
         }
+
       }
       snes_failures = 0;
     } while (looping);
@@ -1400,7 +1410,9 @@ void SNESSolver::updateColoring() {
   // Re-calculate the coloring
   MatColoring coloring = NULL;
   MatColoringCreate(Jfd, &coloring);
-  MatColoringSetType(coloring, MATCOLORINGSL);
+  // MatColoringSetType(coloring, MATCOLORINGSL);  // Serial algorithm. Better for smale-to-medium size problems.
+  MatColoringSetType(coloring, MATCOLORINGGREEDY); // Parallel algorith. Better for large parallel runs
+  // MatColoringSetType(coloring, MATCOLORINGJP);  // This didn't work
   MatColoringSetFromOptions(coloring);
 
   // Calculate new index sets
@@ -1426,25 +1438,33 @@ void SNESSolver::updateColoring() {
   }
 }
 
+
 BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
 
   /* ---------- multiplicative PID factors ---------- */
-  const BoutReal facP = std::pow(double(target_its) / double(nl_its), kP);
-  const BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
-  const BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev)
-                                     / double(nl_its) / double(nl_its_prev2),
-                                 kD);
+  BoutReal facP = std::pow(double(target_its) / double(nl_its),  kP);
+  BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
+  BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev)  / double(nl_its) / double(nl_its_prev2),  kD);
 
-  // clamp growth factor to avoid huge changes
-  const BoutReal fac = std::clamp(facP * facI * facD, 0.2, 5.0);
+  // clamp groth factor to avoid huge changes
+  BoutReal fac = facP * facI * facD;
+  if (fac < 0.2)
+    fac = 0.2;
+  else if (fac > 5.0)
+    fac = 5.0;
 
   /* ---------- update timestep and history ---------- */
-  const BoutReal dt_new = std::min(timestep * fac, max_timestep);
+  BoutReal dt_new = timestep * fac;
+
+  if (dt_new > max_timestep) {
+    dt_new = max_timestep;
+  }
 
   nl_its_prev2 = nl_its_prev;
-  nl_its_prev = nl_its;
+  nl_its_prev  = static_cast<int>(nl_its);
 
   return dt_new;
 }
 
+
 #endif // BOUT_HAS_PETSC

From c20863993e7e87565cecef5a16eb18a97ab9518a Mon Sep 17 00:00:00 2001
From: malamast <42969991+malamast@users.noreply.github.com>
Date: Thu, 17 Jul 2025 17:59:07 +0000
Subject: [PATCH 115/129] Apply clang-format changes

---
 src/solver/impls/snes/snes.cxx | 62 ++++++++++++++++------------------
 1 file changed, 29 insertions(+), 33 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 4f6c11fb42..0b57a52d39 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -119,8 +119,8 @@ SNESSolver::SNESSolver(Options* opts)
                  .doc("Maximum number of nonlinear iterations per SNES solve")
                  .withDefault(50)),
       maxf((*options)["maxf"]
-                 .doc("Maximum number of function evaluations per SNES solve")
-                 .withDefault(10000)),                 
+               .doc("Maximum number of function evaluations per SNES solve")
+               .withDefault(10000)),
       lower_its((*options)["lower_its"]
                     .doc("Iterations below which the next timestep is increased")
                     .withDefault(static_cast<int>(maxits * 0.5))),
@@ -128,25 +128,24 @@ SNESSolver::SNESSolver(Options* opts)
                     .doc("Iterations above which the next timestep is reduced")
                     .withDefault(static_cast<int>(maxits * 0.8))),
       timestep_factor_on_failure((*options)["timestep_factor_on_failure"]
-                                 .doc("Multiply timestep on convergence failure")
-                                 .withDefault(0.5)),
-      timestep_factor_on_upper_its((*options)["timestep_factor_on_upper_its"]
-                                   .doc("Multiply timestep if iterations exceed upper_its")
-                                   .withDefault(0.9)),
-      timestep_factor_on_lower_its((*options)["timestep_factor_on_lower_its"]
-                                   .doc("Multiply timestep if iterations are below lower_its")
-                                   .withDefault(1.4)),
+                                     .doc("Multiply timestep on convergence failure")
+                                     .withDefault(0.5)),
+      timestep_factor_on_upper_its(
+          (*options)["timestep_factor_on_upper_its"]
+              .doc("Multiply timestep if iterations exceed upper_its")
+              .withDefault(0.9)),
+      timestep_factor_on_lower_its(
+          (*options)["timestep_factor_on_lower_its"]
+              .doc("Multiply timestep if iterations are below lower_its")
+              .withDefault(1.4)),
       pidController(
           (*options)["pidController"].doc("Use PID controller?").withDefault(false)),
       target_its((*options)["target_its"]
-                    .doc("Target snes iterations")
-                    .withDefault(static_cast<int>(7))),
-      kP((*options)["kP"].doc("Proportional PID parameter")
-                         .withDefault(0.7)),
-      kI((*options)["kI"].doc("Integral PID parameter")
-                         .withDefault(0.3)),
-      kD((*options)["kD"].doc("Derivative PID parameter")
-                         .withDefault(0.2)),   
+                     .doc("Target snes iterations")
+                     .withDefault(static_cast<int>(7))),
+      kP((*options)["kP"].doc("Proportional PID parameter").withDefault(0.7)),
+      kI((*options)["kI"].doc("Integral PID parameter").withDefault(0.3)),
+      kD((*options)["kD"].doc("Derivative PID parameter").withDefault(0.2)),
       diagnose(
           (*options)["diagnose"].doc("Print additional diagnostics").withDefault(false)),
       diagnose_failures((*options)["diagnose_failures"]
@@ -354,7 +353,7 @@ int SNESSolver::init() {
 
       // Set size of Matrix on each processor to nlocal x nlocal
       MatCreate(BoutComm::get(), &Jfd);
-      MatSetOption(Jfd,MAT_KEEP_NONZERO_PATTERN,PETSC_TRUE);
+      MatSetOption(Jfd, MAT_KEEP_NONZERO_PATTERN, PETSC_TRUE);
       MatSetSizes(Jfd, nlocal, nlocal, PETSC_DETERMINE, PETSC_DETERMINE);
       MatSetFromOptions(Jfd);
       // Determine which row/columns of the matrix are locally owned
@@ -647,7 +646,7 @@ int SNESSolver::init() {
     // Note: If the 'Amat' Jacobian is matrix free, SNESComputeJacobian
     //       always updates its reference 'u' vector every nonlinear iteration
     SNESSetLagJacobian(snes, lag_jacobian);
-    if (pidController){
+    if (pidController) {
       nl_its_prev = target_its;
       nl_its_prev2 = target_its;
       SNESSetLagJacobianPersists(snes, PETSC_FALSE);
@@ -865,8 +864,7 @@ int SNESSolver::run() {
         VecAXPBY(snes_x, -beta, (1. + beta), x1);
       }
 
-
-      if (pidController){
+      if (pidController) {
         SNESSetLagJacobian(snes, lag_jacobian);
       }
 
@@ -1062,7 +1060,7 @@ int SNESSolver::run() {
 
       if (looping) {
 
-        if (pidController){
+        if (pidController) {
           // Changing the timestep.
           // Note: The preconditioner depends on the timestep,
           // so we recalculate the jacobian and the preconditioner
@@ -1077,9 +1075,8 @@ int SNESSolver::run() {
             SNESSetLagJacobian(snes, 1);
           }
 
-
         } else {
-          
+
           // Consider changing the timestep.
           // Note: The preconditioner depends on the timestep,
           // so if it is not recalculated the it will be less
@@ -1119,9 +1116,7 @@ int SNESSolver::run() {
               SNESSetLagJacobian(snes, 1);
             }
           }
-
         }
-
       }
       snes_failures = 0;
     } while (looping);
@@ -1411,7 +1406,8 @@ void SNESSolver::updateColoring() {
   MatColoring coloring = NULL;
   MatColoringCreate(Jfd, &coloring);
   // MatColoringSetType(coloring, MATCOLORINGSL);  // Serial algorithm. Better for smale-to-medium size problems.
-  MatColoringSetType(coloring, MATCOLORINGGREEDY); // Parallel algorith. Better for large parallel runs
+  MatColoringSetType(
+      coloring, MATCOLORINGGREEDY); // Parallel algorith. Better for large parallel runs
   // MatColoringSetType(coloring, MATCOLORINGJP);  // This didn't work
   MatColoringSetFromOptions(coloring);
 
@@ -1438,13 +1434,14 @@ void SNESSolver::updateColoring() {
   }
 }
 
-
 BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
 
   /* ---------- multiplicative PID factors ---------- */
-  BoutReal facP = std::pow(double(target_its) / double(nl_its),  kP);
+  BoutReal facP = std::pow(double(target_its) / double(nl_its), kP);
   BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
-  BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev)  / double(nl_its) / double(nl_its_prev2),  kD);
+  BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev) / double(nl_its)
+                               / double(nl_its_prev2),
+                           kD);
 
   // clamp groth factor to avoid huge changes
   BoutReal fac = facP * facI * facD;
@@ -1461,10 +1458,9 @@ BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
   }
 
   nl_its_prev2 = nl_its_prev;
-  nl_its_prev  = static_cast<int>(nl_its);
+  nl_its_prev = static_cast<int>(nl_its);
 
   return dt_new;
 }
 
-
 #endif // BOUT_HAS_PETSC

From b593a19fc834ccfd9717387f17397c4a54be4719 Mon Sep 17 00:00:00 2001
From: Peter Hill <peter.hill@york.ac.uk>
Date: Fri, 18 Jul 2025 09:18:58 +0100
Subject: [PATCH 116/129] Fix more clang-tidy warnings

---
 examples/laplacexy/laplace_perp/test.cxx |  4 +++-
 tests/MMS/laplace/laplace.cxx            | 18 +++++++++---------
 tests/MMS/spatial/d2dx2/test_d2dx2.cxx   |  7 +++++--
 tests/MMS/spatial/d2dz2/test_d2dz2.cxx   |  8 ++++++--
 4 files changed, 23 insertions(+), 14 deletions(-)

diff --git a/examples/laplacexy/laplace_perp/test.cxx b/examples/laplacexy/laplace_perp/test.cxx
index 291faffabc..75577bb8b7 100644
--- a/examples/laplacexy/laplace_perp/test.cxx
+++ b/examples/laplacexy/laplace_perp/test.cxx
@@ -1,4 +1,5 @@
 #include <bout/bout.hxx>
+#include <bout/field2d.hxx>
 
 #include <bout/derivs.hxx>
 #include <bout/field_factory.hxx>
@@ -51,7 +52,8 @@ int main(int argc, char** argv) {
   ///////////////////////////////////////
 
   // Read an analytic input
-  Field2D input = FieldFactory::get()->create2D("input_field", Options::getRoot(), mesh);
+  const Field2D input =
+      FieldFactory::get()->create2D("input_field", Options::getRoot(), mesh);
 
   // Create a LaplaceXY solver
   LaplaceXY laplacexy{mesh};
diff --git a/tests/MMS/laplace/laplace.cxx b/tests/MMS/laplace/laplace.cxx
index 15fc849d8f..fbcdee355c 100644
--- a/tests/MMS/laplace/laplace.cxx
+++ b/tests/MMS/laplace/laplace.cxx
@@ -1,8 +1,11 @@
 #include <bout/bout.hxx>
-
 #include <bout/constants.hxx>
+#include <bout/field3d.hxx>
 #include <bout/field_factory.hxx>
 #include <bout/invert_laplace.hxx>
+#include <bout/output.hxx>
+
+#include <string>
 
 using bout::globals::mesh;
 using namespace std::string_literals;
@@ -34,16 +37,13 @@ int main(int argc, char** argv) {
   FieldFactory fact(mesh);
 
   const auto input_name = "input_field"s;
-  std::shared_ptr<FieldGenerator> gen = fact.parse(input_name);
+  const auto gen = fact.parse(input_name);
   output.write("GEN = {}\n", gen->str());
 
-  Field3D input = fact.create3D(input_name);
-
-  Field3D result = lap->solve(input);
-
-  Field3D solution = fact.create3D("solution");
-
-  Field3D error = result - solution;
+  const Field3D input = fact.create3D(input_name);
+  const Field3D result = lap->solve(input);
+  const Field3D solution = fact.create3D("solution");
+  const Field3D error = result - solution;
 
   Options dump;
   dump["input"] = input;
diff --git a/tests/MMS/spatial/d2dx2/test_d2dx2.cxx b/tests/MMS/spatial/d2dx2/test_d2dx2.cxx
index 228dca4b2a..7f7127cea9 100644
--- a/tests/MMS/spatial/d2dx2/test_d2dx2.cxx
+++ b/tests/MMS/spatial/d2dx2/test_d2dx2.cxx
@@ -4,7 +4,9 @@
 
 #include <bout/bout.hxx>
 #include <bout/derivs.hxx>
+#include <bout/field3d.hxx>
 #include <bout/field_factory.hxx>
+#include <bout/options.hxx>
 
 using bout::globals::mesh;
 
@@ -13,7 +15,8 @@ int main(int argc, char** argv) {
   BoutInitialise(argc, argv);
 
   Field3D input = FieldFactory::get()->create3D("input_field", Options::getRoot(), mesh);
-  Field3D solution = FieldFactory::get()->create3D("solution", Options::getRoot(), mesh);
+  const Field3D solution =
+      FieldFactory::get()->create3D("solution", Options::getRoot(), mesh);
   // At this point the boundary cells are set to the analytic solution
 
   input.setBoundary("bndry");
@@ -21,7 +24,7 @@ int main(int argc, char** argv) {
 
   // Boundaries of input now set using extrapolation around mid-point boundary
 
-  Field3D result = D2DX2(input);
+  const Field3D result = D2DX2(input);
   // At this point result is not set in the boundary cells
 
   Options dump;
diff --git a/tests/MMS/spatial/d2dz2/test_d2dz2.cxx b/tests/MMS/spatial/d2dz2/test_d2dz2.cxx
index 9dccb6a992..68a12b062f 100644
--- a/tests/MMS/spatial/d2dz2/test_d2dz2.cxx
+++ b/tests/MMS/spatial/d2dz2/test_d2dz2.cxx
@@ -4,7 +4,9 @@
 
 #include <bout/bout.hxx>
 #include <bout/derivs.hxx>
+#include <bout/field3d.hxx>
 #include <bout/field_factory.hxx>
+#include <bout/options.hxx>
 
 using bout::globals::mesh;
 
@@ -12,8 +14,10 @@ int main(int argc, char** argv) {
 
   BoutInitialise(argc, argv);
 
-  Field3D input = FieldFactory::get()->create3D("input_field", Options::getRoot(), mesh);
-  Field3D solution = FieldFactory::get()->create3D("solution", Options::getRoot(), mesh);
+  const Field3D input =
+      FieldFactory::get()->create3D("input_field", Options::getRoot(), mesh);
+  const Field3D solution =
+      FieldFactory::get()->create3D("solution", Options::getRoot(), mesh);
 
   Field3D result = D2DZ2(input);
 

From e8277e4771f55013632bab87f5bd7a2a7678592a Mon Sep 17 00:00:00 2001
From: ZedThree <1486942+ZedThree@users.noreply.github.com>
Date: Fri, 18 Jul 2025 08:24:40 +0000
Subject: [PATCH 117/129] Apply clang-format changes

---
 src/bout++.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/bout++.cxx b/src/bout++.cxx
index 7f23cf5f91..4e9e37fe8d 100644
--- a/src/bout++.cxx
+++ b/src/bout++.cxx
@@ -84,7 +84,7 @@ const char DEFAULT_DIR[] = "data";
 // Define S_ISDIR if not defined by system headers (that is, MSVC)
 // Taken from https://github.com/curl/curl/blob/e59540139a398dc70fde6aec487b19c5085105af/lib/curl_setup.h#L748-L751
 #if !defined(S_ISDIR) && defined(S_IFMT) && defined(S_IFDIR)
-#define S_ISDIR(m) (((m)&S_IFMT) == S_IFDIR)
+#define S_ISDIR(m) (((m) & S_IFMT) == S_IFDIR)
 #endif
 
 #ifdef _MSC_VER

From 7c586e35f822d7c68018dfe9689a39e5ea144712 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Mon, 14 Apr 2025 20:22:11 +0000
Subject: [PATCH 118/129] Bump ZedThree/clang-tidy-review from 0.20.1 to 0.21.0

Bumps [ZedThree/clang-tidy-review](https://github.com/zedthree/clang-tidy-review) from 0.20.1 to 0.21.0.
- [Release notes](https://github.com/zedthree/clang-tidy-review/releases)
- [Changelog](https://github.com/ZedThree/clang-tidy-review/blob/master/CHANGELOG.md)
- [Commits](https://github.com/zedthree/clang-tidy-review/compare/v0.20.1...v0.21.0)

---
updated-dependencies:
- dependency-name: ZedThree/clang-tidy-review
  dependency-version: 0.21.0
  dependency-type: direct:production
  update-type: version-update:semver-minor
...

Signed-off-by: dependabot[bot] <support@github.com>
---
 .github/workflows/clang-tidy-review.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/clang-tidy-review.yml b/.github/workflows/clang-tidy-review.yml
index 1e2f88d208..1a9a0ea079 100644
--- a/.github/workflows/clang-tidy-review.yml
+++ b/.github/workflows/clang-tidy-review.yml
@@ -22,7 +22,7 @@ jobs:
           submodules: true
 
       - name: Run clang-tidy
-        uses: ZedThree/clang-tidy-review@v0.20.1
+        uses: ZedThree/clang-tidy-review@v0.21.0
         id: review
         with:
           build_dir: build
@@ -47,4 +47,4 @@ jobs:
                              -DBOUT_UPDATE_GIT_SUBMODULE=OFF
 
       - name: Upload clang-tidy fixes
-        uses: ZedThree/clang-tidy-review/upload@v0.20.1
+        uses: ZedThree/clang-tidy-review/upload@v0.21.0

From d816d7819e128925fe806052aeebb5ecdac1eaf2 Mon Sep 17 00:00:00 2001
From: malamast <malamas.tsagkaridis@gmail.com>
Date: Fri, 18 Jul 2025 10:23:33 -0700
Subject: [PATCH 119/129] SNES: changes the pidController flag to
 pid_controller to match the variable naming convention.

---
 src/solver/impls/snes/snes.cxx | 10 +++++-----
 src/solver/impls/snes/snes.hxx |  2 +-
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 4f6c11fb42..8c10052e33 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -136,8 +136,8 @@ SNESSolver::SNESSolver(Options* opts)
       timestep_factor_on_lower_its((*options)["timestep_factor_on_lower_its"]
                                    .doc("Multiply timestep if iterations are below lower_its")
                                    .withDefault(1.4)),
-      pidController(
-          (*options)["pidController"].doc("Use PID controller?").withDefault(false)),
+      pid_controller(
+          (*options)["pid_controller"].doc("Use PID controller?").withDefault(false)),
       target_its((*options)["target_its"]
                     .doc("Target snes iterations")
                     .withDefault(static_cast<int>(7))),
@@ -647,7 +647,7 @@ int SNESSolver::init() {
     // Note: If the 'Amat' Jacobian is matrix free, SNESComputeJacobian
     //       always updates its reference 'u' vector every nonlinear iteration
     SNESSetLagJacobian(snes, lag_jacobian);
-    if (pidController){
+    if (pid_controller){
       nl_its_prev = target_its;
       nl_its_prev2 = target_its;
       SNESSetLagJacobianPersists(snes, PETSC_FALSE);
@@ -866,7 +866,7 @@ int SNESSolver::run() {
       }
 
 
-      if (pidController){
+      if (pid_controller){
         SNESSetLagJacobian(snes, lag_jacobian);
       }
 
@@ -1062,7 +1062,7 @@ int SNESSolver::run() {
 
       if (looping) {
 
-        if (pidController){
+        if (pid_controller){
           // Changing the timestep.
           // Note: The preconditioner depends on the timestep,
           // so we recalculate the jacobian and the preconditioner
diff --git a/src/solver/impls/snes/snes.hxx b/src/solver/impls/snes/snes.hxx
index 8a0b5bcecb..e31ca44625 100644
--- a/src/solver/impls/snes/snes.hxx
+++ b/src/solver/impls/snes/snes.hxx
@@ -108,7 +108,7 @@ private:
   BoutReal timestep_factor_on_lower_its;
 
   ///< PID controller parameters
-  bool pidController; ///< Use PID controller?
+  bool pid_controller; ///< Use PID controller?
   int target_its;     ///< Target number of nonlinear iterations for the PID controller.
   ///< Use with caution! Not tested values.
   BoutReal kP; ///< (0.6 - 0.8) Proportional parameter (main response to current step)

From 751a22f6ce2a75047c3e61047bfd4aec5ce62ee2 Mon Sep 17 00:00:00 2001
From: malamast <malamas.tsagkaridis@gmail.com>
Date: Thu, 24 Jul 2025 11:34:02 -0700
Subject: [PATCH 120/129] SNES: reapplied some changes from previous commits
 that accidentally got deleted.

---
 src/solver/impls/snes/snes.cxx | 37 +++++++++++-----------------------
 src/solver/impls/snes/snes.hxx |  2 +-
 2 files changed, 13 insertions(+), 26 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 6b0438bb8b..eda4e9e783 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -140,9 +140,7 @@ SNESSolver::SNESSolver(Options* opts)
               .withDefault(1.4)),
       pid_controller(
           (*options)["pid_controller"].doc("Use PID controller?").withDefault(false)),
-      target_its((*options)["target_its"]
-                     .doc("Target snes iterations")
-                     .withDefault(static_cast<int>(7))),
+      target_its((*options)["target_its"].doc("Target snes iterations").withDefault(7)),
       kP((*options)["kP"].doc("Proportional PID parameter").withDefault(0.7)),
       kI((*options)["kI"].doc("Integral PID parameter").withDefault(0.3)),
       kD((*options)["kD"].doc("Derivative PID parameter").withDefault(0.2)),
@@ -646,7 +644,7 @@ int SNESSolver::init() {
     // Note: If the 'Amat' Jacobian is matrix free, SNESComputeJacobian
     //       always updates its reference 'u' vector every nonlinear iteration
     SNESSetLagJacobian(snes, lag_jacobian);
-    if (pid_controller){
+    if (pid_controller) {
       nl_its_prev = target_its;
       nl_its_prev2 = target_its;
       SNESSetLagJacobianPersists(snes, PETSC_FALSE);
@@ -865,7 +863,7 @@ int SNESSolver::run() {
       }
 
 
-      if (pid_controller){
+      if (pid_controller) {
         SNESSetLagJacobian(snes, lag_jacobian);
       }
 
@@ -1061,7 +1059,7 @@ int SNESSolver::run() {
 
       if (looping) {
 
-        if (pid_controller){
+        if (pid_controller) {
           // Changing the timestep.
           // Note: The preconditioner depends on the timestep,
           // so we recalculate the jacobian and the preconditioner
@@ -1087,9 +1085,7 @@ int SNESSolver::run() {
             // Increase timestep slightly
             timestep *= timestep_factor_on_lower_its;
 
-            if (timestep > max_timestep) {
-              timestep = max_timestep;
-            }
+            timestep = std::min(timestep, max_timestep);
 
             // Note: Setting the SNESJacobianFn to NULL retains
             // previously set evaluation function.
@@ -1407,8 +1403,7 @@ void SNESSolver::updateColoring() {
   MatColoring coloring = NULL;
   MatColoringCreate(Jfd, &coloring);
   // MatColoringSetType(coloring, MATCOLORINGSL);  // Serial algorithm. Better for smale-to-medium size problems.
-  MatColoringSetType(
-      coloring, MATCOLORINGGREEDY); // Parallel algorith. Better for large parallel runs
+  MatColoringSetType(coloring, MATCOLORINGGREEDY); // Parallel algorith. Better for large parallel runs
   // MatColoringSetType(coloring, MATCOLORINGJP);  // This didn't work
   MatColoringSetFromOptions(coloring);
 
@@ -1438,28 +1433,20 @@ void SNESSolver::updateColoring() {
 BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
 
   /* ---------- multiplicative PID factors ---------- */
-  BoutReal facP = std::pow(double(target_its) / double(nl_its), kP);
-  BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
-  BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev) / double(nl_its)
+  const BoutReal facP = std::pow(double(target_its) / double(nl_its), kP);
+  const BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
+  const BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev) / double(nl_its)
                                / double(nl_its_prev2),
                            kD);
 
   // clamp groth factor to avoid huge changes
-  BoutReal fac = facP * facI * facD;
-  if (fac < 0.2)
-    fac = 0.2;
-  else if (fac > 5.0)
-    fac = 5.0;
+  const BoutReal fac = std::clamp(facP * facI * facD, 0.2, 5.0);
 
   /* ---------- update timestep and history ---------- */
-  BoutReal dt_new = timestep * fac;
-
-  if (dt_new > max_timestep) {
-    dt_new = max_timestep;
-  }
+  const BoutReal dt_new = std::min(timestep * fac, max_timestep);
 
   nl_its_prev2 = nl_its_prev;
-  nl_its_prev = static_cast<int>(nl_its);
+  nl_its_prev = nl_its;
 
   return dt_new;
 }
diff --git a/src/solver/impls/snes/snes.hxx b/src/solver/impls/snes/snes.hxx
index e31ca44625..bd942f09ff 100644
--- a/src/solver/impls/snes/snes.hxx
+++ b/src/solver/impls/snes/snes.hxx
@@ -109,7 +109,7 @@ private:
 
   ///< PID controller parameters
   bool pid_controller; ///< Use PID controller?
-  int target_its;     ///< Target number of nonlinear iterations for the PID controller.
+  int target_its;      ///< Target number of nonlinear iterations for the PID controller.
   ///< Use with caution! Not tested values.
   BoutReal kP; ///< (0.6 - 0.8) Proportional parameter (main response to current step)
   BoutReal kI; ///< (0.2 - 0.4) Integral parameter (smooths history of changes)

From 865c0ab26987f393b9e8ab9294603259a501e3f1 Mon Sep 17 00:00:00 2001
From: malamast <42969991+malamast@users.noreply.github.com>
Date: Thu, 24 Jul 2025 19:35:33 +0000
Subject: [PATCH 121/129] Apply clang-format changes

---
 src/solver/impls/snes/snes.cxx | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index eda4e9e783..72891941b6 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -862,7 +862,6 @@ int SNESSolver::run() {
         VecAXPBY(snes_x, -beta, (1. + beta), x1);
       }
 
-
       if (pid_controller) {
         SNESSetLagJacobian(snes, lag_jacobian);
       }
@@ -1403,7 +1402,8 @@ void SNESSolver::updateColoring() {
   MatColoring coloring = NULL;
   MatColoringCreate(Jfd, &coloring);
   // MatColoringSetType(coloring, MATCOLORINGSL);  // Serial algorithm. Better for smale-to-medium size problems.
-  MatColoringSetType(coloring, MATCOLORINGGREEDY); // Parallel algorith. Better for large parallel runs
+  MatColoringSetType(
+      coloring, MATCOLORINGGREEDY); // Parallel algorith. Better for large parallel runs
   // MatColoringSetType(coloring, MATCOLORINGJP);  // This didn't work
   MatColoringSetFromOptions(coloring);
 
@@ -1435,9 +1435,9 @@ BoutReal SNESSolver::pid(BoutReal timestep, int nl_its) {
   /* ---------- multiplicative PID factors ---------- */
   const BoutReal facP = std::pow(double(target_its) / double(nl_its), kP);
   const BoutReal facI = std::pow(double(nl_its_prev) / double(nl_its), kI);
-  const BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev) / double(nl_its)
-                               / double(nl_its_prev2),
-                           kD);
+  const BoutReal facD = std::pow(double(nl_its_prev) * double(nl_its_prev)
+                                     / double(nl_its) / double(nl_its_prev2),
+                                 kD);
 
   // clamp groth factor to avoid huge changes
   const BoutReal fac = std::clamp(facP * facI * facD, 0.2, 5.0);

From dd146a80b92dbf4afe42dd426e572bd07eb9066c Mon Sep 17 00:00:00 2001
From: Tom Body <116750897+tbody-cfs@users.noreply.github.com>
Date: Wed, 16 Apr 2025 20:27:18 -0400
Subject: [PATCH 122/129] Update CMakeLists.txt

Address #2945
---
 CMakeLists.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index c45fca3b72..9405c9e8d6 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -51,7 +51,7 @@ message(STATUS "Configuring BOUT++ version ${BOUT_FULL_VERSION}")
 project(BOUT++
   DESCRIPTION "Fluid PDE solver framework"
   VERSION ${BOUT_CMAKE_ACCEPTABLE_VERSION}
-  LANGUAGES CXX)
+  LANGUAGES C CXX)
 
 include(CMakeDependentOption)
 

From 5988480b4f509c24b76602405fe4d4133a3eeb9c Mon Sep 17 00:00:00 2001
From: Tom Body <tbody@cfs.energy>
Date: Fri, 18 Apr 2025 16:18:09 +0000
Subject: [PATCH 123/129] Move enable_language(C) to FindnetCDF

---
 cmake/FindnetCDF.cmake          | 1 +
 cmake/SetupBOUTThirdParty.cmake | 1 -
 2 files changed, 1 insertion(+), 1 deletion(-)

diff --git a/cmake/FindnetCDF.cmake b/cmake/FindnetCDF.cmake
index 393c57549b..361095954e 100644
--- a/cmake/FindnetCDF.cmake
+++ b/cmake/FindnetCDF.cmake
@@ -32,6 +32,7 @@ if (NOT netCDF_ROOT AND EXISTS "${BOUT_USE_NETCDF}")
   set(netCDF_ROOT "${BOUT_USE_NETCDF}")
 endif()
 
+enable_language(C)
 find_package(netCDF QUIET CONFIG)
 
 if (netCDF_FOUND)
diff --git a/cmake/SetupBOUTThirdParty.cmake b/cmake/SetupBOUTThirdParty.cmake
index 10942f8aa9..f8712c1b58 100644
--- a/cmake/SetupBOUTThirdParty.cmake
+++ b/cmake/SetupBOUTThirdParty.cmake
@@ -293,7 +293,6 @@ if (BOUT_USE_SUNDIALS)
     FetchContent_MakeAvailable(sundials)
     message(STATUS "SUNDIALS done configuring")
   else()
-    enable_language(C)
     find_package(SUNDIALS REQUIRED)
     if (SUNDIALS_VERSION VERSION_LESS 4.0.0)
       message(FATAL_ERROR "SUNDIALS_VERSION 4.0.0 or newer is required. Found version ${SUNDIALS_VERSION}.")

From 0f7c8546e6a5396c5c692a631bf103d0cde945bc Mon Sep 17 00:00:00 2001
From: Tom Body <tbody@cfs.energy>
Date: Fri, 18 Apr 2025 17:36:08 +0000
Subject: [PATCH 124/129] Remove top-level C

---
 CMakeLists.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 9405c9e8d6..c45fca3b72 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -51,7 +51,7 @@ message(STATUS "Configuring BOUT++ version ${BOUT_FULL_VERSION}")
 project(BOUT++
   DESCRIPTION "Fluid PDE solver framework"
   VERSION ${BOUT_CMAKE_ACCEPTABLE_VERSION}
-  LANGUAGES C CXX)
+  LANGUAGES CXX)
 
 include(CMakeDependentOption)
 

From 0ab77ba7c88ba13d693d565423e2311abd59feac Mon Sep 17 00:00:00 2001
From: Tom Body <tbody@cfs.energy>
Date: Fri, 18 Apr 2025 18:47:12 +0000
Subject: [PATCH 125/129] Add back in C language for SUNDIALS

---
 cmake/SetupBOUTThirdParty.cmake | 1 +
 1 file changed, 1 insertion(+)

diff --git a/cmake/SetupBOUTThirdParty.cmake b/cmake/SetupBOUTThirdParty.cmake
index f8712c1b58..53ceb4351c 100644
--- a/cmake/SetupBOUTThirdParty.cmake
+++ b/cmake/SetupBOUTThirdParty.cmake
@@ -272,6 +272,7 @@ option(BOUT_DOWNLOAD_SUNDIALS "Download and build SUNDIALS" OFF)
 cmake_dependent_option(BOUT_USE_SUNDIALS "Enable support for SUNDIALS time solvers" OFF
   "NOT BOUT_DOWNLOAD_SUNDIALS" ON)
 if (BOUT_USE_SUNDIALS)
+  enable_language(C)
   if (BOUT_DOWNLOAD_SUNDIALS)
     message(STATUS "Downloading and configuring SUNDIALS")
     include(FetchContent)

From ec1f94f45ddfc0fe9cc9d83e8e4058d9b48af1b7 Mon Sep 17 00:00:00 2001
From: Ben Dudson <dudson2@llnl.gov>
Date: Wed, 13 Aug 2025 10:29:05 -0700
Subject: [PATCH 126/129] snes: Print a warning if the coloring is
 non-symmetric.

Added comments to explain why the coloring may be non-symmetric around
an X-point.
---
 src/solver/impls/snes/snes.cxx | 24 ++++++++++++++++++------
 1 file changed, 18 insertions(+), 6 deletions(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 72891941b6..134b63c2f8 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -377,8 +377,8 @@ int SNESSolver::init() {
       auto n_cross = (*options)["stencil:cross"]
                          .doc("Extent of stencil (cross)")
                          .withDefault<int>(0);
-      //Set n_taxi 2 if nothing else is set
-      //Probably a better way to do this
+      // Set n_taxi 2 if nothing else is set
+      // Probably a better way to do this
       if (n_square == 0 && n_taxi == 0 && n_cross == 0) {
         output_info.write("Setting solver:stencil:taxi = 2\n");
         n_taxi = 2;
@@ -485,7 +485,7 @@ int SNESSolver::init() {
         d_nnz.reserve(nlocal);
 
         for (int i = 0; i < nlocal; ++i) {
-          //Assume all elements in the z direction are potentially coupled
+          // Assume all elements in the z direction are potentially coupled
           d_nnz.emplace_back(d_nnz_map3d[i].size() * mesh->LocalNz
                              + d_nnz_map2d[i].size());
           o_nnz.emplace_back(o_nnz_map3d[i].size() * mesh->LocalNz
@@ -598,9 +598,21 @@ int SNESSolver::init() {
       MatAssemblyBegin(Jfd, MAT_FINAL_ASSEMBLY);
       MatAssemblyEnd(Jfd, MAT_FINAL_ASSEMBLY);
 
-      //The above will probably miss some non-zero entries at process boundaries
-      //Making sure the colouring matrix is symmetric will in some/all(?)
-      //of the missing non-zeros
+      {
+        // Test if the matrix is symmetric
+        // Values are 0 or 1 so tolerance (1e-5) shouldn't matter
+        PetscBool symmetric;
+        ierr = MatIsSymmetric(Jfd, 1e-5, &symmetric); CHKERRQ(ierr);
+        if (!symmetric) {
+          output_warn.write("Jacobian pattern is not symmetric\n");
+        }
+      }
+
+      // The above can miss entries around the X-point branch cut:
+      // The diagonal terms are complicated because moving in X then Y
+      // is different from moving in Y then X at the X-point.
+      // Making sure the colouring matrix is symmetric does not
+      // necessarily give the correct stencil but may help.
       if ((*options)["force_symmetric_coloring"]
               .doc("Modifies coloring matrix to force it to be symmetric")
               .withDefault<bool>(false)) {

From cf7e0437af135d4812ae77bf9819dbb918c7a838 Mon Sep 17 00:00:00 2001
From: bendudson <219233+bendudson@users.noreply.github.com>
Date: Wed, 13 Aug 2025 22:37:55 +0000
Subject: [PATCH 127/129] Apply clang-format changes

---
 src/solver/impls/snes/snes.cxx | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/solver/impls/snes/snes.cxx b/src/solver/impls/snes/snes.cxx
index 134b63c2f8..2bb163f324 100644
--- a/src/solver/impls/snes/snes.cxx
+++ b/src/solver/impls/snes/snes.cxx
@@ -602,7 +602,8 @@ int SNESSolver::init() {
         // Test if the matrix is symmetric
         // Values are 0 or 1 so tolerance (1e-5) shouldn't matter
         PetscBool symmetric;
-        ierr = MatIsSymmetric(Jfd, 1e-5, &symmetric); CHKERRQ(ierr);
+        ierr = MatIsSymmetric(Jfd, 1e-5, &symmetric);
+        CHKERRQ(ierr);
         if (!symmetric) {
           output_warn.write("Jacobian pattern is not symmetric\n");
         }

From 89c20ec95e17a5b1c564e58512f8482ce3a20958 Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 20 Aug 2025 11:09:30 +0100
Subject: [PATCH 128/129] Use snake_case for function
 CylindricalCoordinatesToCartesian()

---
 include/bout/tokamak_coordinates.hxx              | 2 +-
 src/mesh/tokamak_coordinates.cxx                  | 2 +-
 tests/unit/mesh/test_change_coordinate_system.cxx | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/include/bout/tokamak_coordinates.hxx b/include/bout/tokamak_coordinates.hxx
index dd1629799c..0f3f2ea65f 100644
--- a/include/bout/tokamak_coordinates.hxx
+++ b/include/bout/tokamak_coordinates.hxx
@@ -35,7 +35,7 @@ namespace bout {
 
         void normalise(BoutReal Lbar, BoutReal Bbar, BoutReal ShearFactor);
 
-        Coordinates3D CylindricalCoordinatesToCartesian();
+        Coordinates3D cylindrical_coordinates_to_cartesian();
     };
 
     BoutReal get_sign_of_bp(const Field2D &Bpxy);
diff --git a/src/mesh/tokamak_coordinates.cxx b/src/mesh/tokamak_coordinates.cxx
index 740d19e325..d90ec43078 100644
--- a/src/mesh/tokamak_coordinates.cxx
+++ b/src/mesh/tokamak_coordinates.cxx
@@ -36,7 +36,7 @@ namespace bout {
         }
     }
 
-    Coordinates3D TokamakOptions::CylindricalCoordinatesToCartesian() {
+    Coordinates3D TokamakOptions::cylindrical_coordinates_to_cartesian() {
 
         auto* mesh = Rxy.getMesh();
         Field3D x = Field3D(0.0, mesh);
diff --git a/tests/unit/mesh/test_change_coordinate_system.cxx b/tests/unit/mesh/test_change_coordinate_system.cxx
index d9ae71e14c..d513007d65 100644
--- a/tests/unit/mesh/test_change_coordinate_system.cxx
+++ b/tests/unit/mesh/test_change_coordinate_system.cxx
@@ -49,7 +49,7 @@ TEST_F(CoordinateTransformTest, CylindricalToCartesian) {
     }
 
     // act
-    bout::Coordinates3D cartesian_coords = tokamak_options.CylindricalCoordinatesToCartesian();
+    bout::Coordinates3D cartesian_coords = tokamak_options.cylindrical_coordinates_to_cartesian();
 
     // assert
     const auto max_r = *std::max_element(begin(r_values), end(r_values));

From b512667e11ea02bdc45e181197923c280806902a Mon Sep 17 00:00:00 2001
From: tomc271 <tomc271@gmail.com>
Date: Wed, 20 Aug 2025 13:18:17 +0100
Subject: [PATCH 129/129] Merge branch 'refactor-coordinates' into
 cylindrical-to-cartesian into fake_mesh_fixture.hxx

---
 tests/unit/fake_mesh_fixture.hxx | 54 ++++++++++++++++++--------------
 1 file changed, 31 insertions(+), 23 deletions(-)

diff --git a/tests/unit/fake_mesh_fixture.hxx b/tests/unit/fake_mesh_fixture.hxx
index 2758dbe416..3c2215acba 100644
--- a/tests/unit/fake_mesh_fixture.hxx
+++ b/tests/unit/fake_mesh_fixture.hxx
@@ -41,28 +41,32 @@ public:
     bout::globals::mpi = &mpi;
     bout::globals::mesh = &mesh_m;
     bout::globals::mesh->createDefaultRegions();
-    mesh_m.setCoordinates(nullptr);
+    static_cast<FakeMesh*>(bout::globals::mesh)->setCoordinates(nullptr);
     test_coords = std::make_shared<Coordinates>(
         bout::globals::mesh, Field2D{1.0}, Field2D{1.0}, Field2D{1.0}, Field2D{1.0},
         Field2D{1.0}, Field2D{1.0}, Field2D{1.0}, Field2D{1.0}, Field2D{0.0},
         Field2D{0.0}, Field2D{0.0}, Field2D{1.0}, Field2D{1.0}, Field2D{1.0},
         Field2D{0.0}, Field2D{0.0}, Field2D{0.0}, Field2D{0.0}, Field2D{0.0});
 
-    // Set some auxilliary variables
-    // Usually set in geometry()
-    // Note: For testing these are set to non-zero values
-    test_coords->G1 = test_coords->G2 = test_coords->G3 = 0.1;
-
     // Set nonuniform corrections
-    test_coords->non_uniform = true;
-    test_coords->d1_dx = test_coords->d1_dy = 0.2;
-    test_coords->d1_dz = 0.0;
+    test_coords->setNon_uniform(true);
+    test_coords->setD1_dx(0.2);
+    test_coords->setD1_dy(0.2);
+    test_coords->setD1_dz(0.0);
+
 #if BOUT_USE_METRIC_3D
-    test_coords->Bxy.splitParallelSlices();
-    test_coords->Bxy.yup() = test_coords->Bxy.ydown() = test_coords->Bxy;
+
+    FieldMetric mutable_Bxy = test_coords->Bxy();
+    mutable_Bxy.splitParallelSlices();
+    test_coords->setBxy(mutable_Bxy);
+
+    mutable_Bxy = test_coords->Bxy();
+    mutable_Bxy.yup() = test_coords->Bxy();
+    mutable_Bxy.ydown() = test_coords->Bxy();
+    test_coords->setBxy(mutable_Bxy);
+
 #endif
 
-    // No call to Coordinates::geometry() needed here
     mesh_m.setCoordinates(test_coords);
     mesh_m.setGridDataSource(new FakeGridDataSource());
     // May need a ParallelTransform to create fields, because create3D calls
@@ -90,21 +94,25 @@ public:
         Field2D{0.0, &mesh_staggered_m}, Field2D{0.0, &mesh_staggered_m},
         Field2D{0.0, &mesh_staggered_m}, Field2D{0.0, &mesh_staggered_m});
 
-    // Set some auxilliary variables
-    test_coords_staggered->G1 = test_coords_staggered->G2 = test_coords_staggered->G3 =
-        0.1;
-
     // Set nonuniform corrections
-    test_coords_staggered->non_uniform = true;
-    test_coords_staggered->d1_dx = test_coords_staggered->d1_dy = 0.2;
-    test_coords_staggered->d1_dz = 0.0;
+    test_coords_staggered->setNon_uniform(true);
+    test_coords_staggered->setD1_dx(0.2);
+    test_coords_staggered->setD1_dy(0.2);
+    test_coords_staggered->setD1_dz(0.0);
+
 #if BOUT_USE_METRIC_3D
-    test_coords_staggered->Bxy.splitParallelSlices();
-    test_coords_staggered->Bxy.yup() = test_coords_staggered->Bxy.ydown() =
-        test_coords_staggered->Bxy;
+
+    mutable_Bxy = test_coords_staggered->Bxy();
+    mutable_Bxy.splitParallelSlices();
+    test_coords_staggered->setBxy(mutable_Bxy);
+
+    mutable_Bxy = test_coords_staggered->Bxy();
+    mutable_Bxy.yup() = test_coords_staggered->Bxy();
+    mutable_Bxy.ydown() = test_coords_staggered->Bxy();
+    test_coords_staggered->setBxy(mutable_Bxy);
+
 #endif
 
-    // No call to Coordinates::geometry() needed here
     test_coords_staggered->setParallelTransform(
         bout::utils::make_unique<ParallelTransformIdentity>(mesh_staggered_m));