From 1fa1e04f6b5ef60547fe8ec5190a49891137907e Mon Sep 17 00:00:00 2001
From: Andrew Shao <Andrew.Shao@hpe.com>
Date: Mon, 29 Sep 2025 12:43:18 -0500
Subject: [PATCH 1/3] Add weighted loss function

Adjust the loss function to weight by the distance from the
"center" of the ellipsoid by an exponent d (e.g. r^{d}).
Additionally, reduce the default size of the MLP to avoid having
an underdetermined system (# of free parameters > samples).
---
 Allwmake                            |   2 +-
 run/meshMotion/ml_model_training.py | 106 ++++++++++++++--------------
 run/meshMotion/smartsim_driver.py   |  67 ++++++++++++------
 3 files changed, 99 insertions(+), 76 deletions(-)

diff --git a/Allwmake b/Allwmake
index 4dc38d0..e0430ee 100755
--- a/Allwmake
+++ b/Allwmake
@@ -39,7 +39,7 @@ elif [ $WM_COMPILER == "Icx" ]; then
 fi
 make lib
 cd "$_REPO_ROOT" || exit 1
-cp $FOAM_SMARTREDIS/install/lib/libsmartredis.so $FOAM_USER_LIBBIN 
+cp $FOAM_SMARTREDIS/install/lib64/libsmartredis.so $FOAM_USER_LIBBIN 
 cp $FOAM_SMARTREDIS/build/Release/hiredis-prefix/src/hiredis-build/libhiredis.a $FOAM_USER_LIBBIN
 cp $FOAM_SMARTREDIS/build/Release/redis++-prefix/src/redis++-build/libredis++.a $FOAM_USER_LIBBIN
 export FOAM_CODE_TEMPLATES=$_REPO_ROOT/etc/dynamicCode/
diff --git a/run/meshMotion/ml_model_training.py b/run/meshMotion/ml_model_training.py
index 7983477..12b3643 100644
--- a/run/meshMotion/ml_model_training.py
+++ b/run/meshMotion/ml_model_training.py
@@ -5,7 +5,7 @@
 import numpy as np
 import io
 from sklearn.model_selection import train_test_split
-import torch.optim as optim 
+import torch.optim as optim
 import time
 from typing import Tuple, Union
 from matplotlib import pyplot as plt
@@ -30,7 +30,14 @@ def __init__(self, num_layers, layer_width, input_size, output_size, activation_
     def forward(self, x):
         return self.layers(x)
 
-def train(num_mpi_ranks):
+def loss_weighted_center(y_true, y_pred, weights, weights_power):
+    weights_normed = torch.pow(weights, weights_power)
+    weights_normed = weights_normed/torch.sum(weights_normed)
+
+    return torch.sum(torch.sum((y_true-y_pred)**2, dim=1)*weights_normed)
+
+
+def train(args):
     client = Client()
     torch.set_default_dtype(torch.float64)
 
@@ -38,24 +45,24 @@ def train(num_mpi_ranks):
     dimension = int(client.get_tensor("solution_dim"))
 
     print (f"Solution dimension = {dimension}.")
-    
+
     # Initialize the model
     model = MLP(
-        num_layers=3, 
-        layer_width=50, 
-        input_size=dimension, 
-        output_size=dimension, 
-        activation_fn=torch.nn.ReLU()
+        num_layers=3,
+        layer_width=10,
+        input_size=dimension,
+        output_size=dimension,
+        activation_fn=torch.nn.ELU()
     )
 
     # Initialize the optimizer
-    learning_rate = 1e-03
+    learning_rate = 1e-3
     optimizer = optim.Adam(model.parameters(), lr=learning_rate)
-    
+
     # Make sure all datasets are avaialble in the smartredis database.
     iteration = 1
     while True:
-    
+
         print (f"Iteration {iteration}")
 
         data_ready = client.poll_key("data_ready", 1, 10000)
@@ -64,66 +71,60 @@ def train(num_mpi_ranks):
 
         points = client.get_tensor("points")
         displacements = client.get_tensor("displacements")
+
         client.delete_tensor("data_ready")
 
-        # Split training and validation data 
-        points_train, points_val, displ_train, displ_val = train_test_split(
-            points,
-            displacements,
-            test_size=0.2,
-            random_state=42
-        )
+        X = torch.from_numpy(points).to(torch.float64)
+        y = torch.from_numpy(displacements).to(torch.float64)
+
+        # Find the center of the shape as the average of all the points on the inner boundary
+        r = torch.sqrt(torch.sum(X**2, dim=1))
+        inner = r < 5
+        center = torch.mean(X[inner], dim=0)
+
+        dist = torch.sqrt(torch.sum((X-center)**2, dim=1))
+        wts = dist/torch.sum(dist)
 
-        # Convert to torch.Tensor 
-        points_train = torch.from_numpy(points_train).to(torch.float64)
-        points_val   = torch.from_numpy(points_val).to(torch.float64)
-        displ_train  = torch.from_numpy(displ_train).to(torch.float64)
-        displ_val    = torch.from_numpy(displ_val).to(torch.float64)
-    
-        loss_func = nn.MSELoss()
-      
-        mean_mag_displ = torch.mean(torch.norm(displ_train, dim=1))
         validation_rmse = []
         model.train()
-        epochs = 2000
+        epochs = 5000
         n_epochs = 0
-        rmse_loss_val = 1
 
-        for epoch in range(epochs):    
+        for epoch in range(epochs):
             # Zero the gradients
             optimizer.zero_grad()
-    
+
             # Forward pass on the training data
-            displ_pred = model(points_train)
-    
+            displ_pred = model(X)
+
             # Compute loss on the training data
-            loss_train = loss_func(displ_pred, displ_train)
-    
+            loss_train = loss_weighted_center(displ_pred, y, wts, args.radius_power)
+
+            if (loss_train < 5e-05):
+                break
+
             # Backward pass and optimization
             loss_train.backward()
             optimizer.step()
 
             n_epochs = n_epochs + 1
-            # Forward pass on the validation data, with torch.no_grad() for efficiency
-            with torch.no_grad():
-                displ_pred_val = model(points_val)
-                mse_loss_val = loss_func(displ_pred_val, displ_val)
-                rmse_loss_val = torch.sqrt(mse_loss_val)
-                validation_rmse.append(rmse_loss_val)
-                if (mse_loss_val < 1e-04):
-                    break
-    
-        print (f"RMSE {validation_rmse[-1]}, number of epochs {n_epochs}")
+
+        print (f"MSE {loss_train.item()}, number of epochs {n_epochs}", flush=True)
+        np.savez(
+            f"data_{iteration:02d}.npz",
+            points=points,
+            displacements=displacements,
+        )
 
         # Uncomment to visualize validation RMSE
         plt.loglog()
         plt.title("Validation loss RMSE")
         plt.xlabel("Epochs")
         plt.plot(validation_rmse)
-        plt.savefig(f"validation_rmse_{epoch:04d}.png")
-    
+        plt.savefig(f"validation_rmse_{iteration:04d}.png")
+
         # Store the model into SmartRedis
-        # Put the model in evaluation mode. 
+        # Put the model in evaluation mode.
         model.eval() # TEST
         # Prepare a sample input
         example_forward_input = torch.rand(dimension)
@@ -136,11 +137,11 @@ def train(num_mpi_ranks):
         print("Saving model")
         client.set_model("model", model_buffer.getvalue(), "TORCH", "CPU")
         client.put_tensor("model_ready", np.array([0]))
-    
-        # Increase CFD+ML iteration 
+
+        # Increase CFD+ML iteration
         iteration = iteration + 1
 
-        # Check final iteration index and break 
+        # Check final iteration index and break
         if client.poll_key("final_iteration", 10, 10):
            print ("final iteration reached.")
            break
@@ -148,6 +149,7 @@ def train(num_mpi_ranks):
 if __name__ == "__main__":
     parser = argparse.ArgumentParser(description="Training script for mesh motion")
     parser.add_argument("mpi_ranks", help="number of mpi ranks", type=int)
+    parser.add_argument("radius_power", help="power law to weight losses", type=float)
     args = parser.parse_args()
 
-    train(args.mpi_ranks)
+    train(args)
diff --git a/run/meshMotion/smartsim_driver.py b/run/meshMotion/smartsim_driver.py
index 863a627..e612e08 100644
--- a/run/meshMotion/smartsim_driver.py
+++ b/run/meshMotion/smartsim_driver.py
@@ -8,33 +8,30 @@
 
 from smartsim import Experiment
 
-def main():
-    parser = argparse.ArgumentParser(
-        description="Run a SmartSim Machine-Learning mesh deformation experiment"
-    )
-    parser.add_argument(
-        "--experiment", "-e",
-        required=True,
-        help="Name of the SmartSim experiment (e.g., mesh_deformation)"
-    )
-    parser.add_argument(
-        "--case", "-c",
-        required=True,
-        help="Name of the OpenFOAM case folder (e.g., ellipsoid3D)"
-    )
-    args = parser.parse_args()
+platform_config = {
+    "local": {
+        "launcher": "local",
+        "interface": "lo"
+    },
+    "hotlum": {
+        "launcher": "slurm",
+        "interface": "bond0"
+    }
+}
+
+def main(args):
 
     # ----------------------------------------------------------------
     # Create the SmartSim experiment
     # ----------------------------------------------------------------
 
-    exp = Experiment(args.experiment, launcher="local")
+    exp = Experiment(args.experiment, launcher=platform_config[args.platform]["launcher"])
 
     # ----------------------------------------------------------------
     # Launch the database
     # ----------------------------------------------------------------
 
-    db = exp.create_database(port=8000, interface="lo")
+    db = exp.create_database(port=8000, interface=platform_config[args.platform]["interface"])
     exp.generate(db, overwrite=True)
     exp.start(db)
     print(f"Database started at: {db.get_address()}")
@@ -55,16 +52,15 @@ def main():
     # ----------------------------------------------------------------
     # Configure and create the OpenFOAM mesh-motion model
     # ----------------------------------------------------------------
-    
-    # Create OpenFOAM moveDynamicMesh run settings 
+
+    # Create OpenFOAM moveDynamicMesh run settings
     openfoam_rs = exp.create_run_settings(
         exe="moveDynamicMesh",
         exe_args="-parallel",
-        run_command="mpirun",
-        run_args={"n": f"{num_mpi_ranks}"}
     )
     openfoam_rs.set_tasks(num_mpi_ranks)
     openfoam_rs.set_nodes(1)
+    openfoam_rs.set("exclusive")
 
     # Create the model from the OpenFOAM case argument
     openfoam_model = exp.create_model(
@@ -79,7 +75,7 @@ def main():
 
     training_rs = exp.create_run_settings(
         exe="python",
-        exe_args=f"ml_model_training.py {num_mpi_ranks}"
+        exe_args=f"ml_model_training.py {num_mpi_ranks} {args.radius_power}"
     )
     training_rs.set_tasks(1)
     training_rs.set_nodes(1)
@@ -111,4 +107,29 @@ def main():
         exp.stop(db)
 
 if __name__ == "__main__":
-    main()
+    parser = argparse.ArgumentParser(
+        description="Run a SmartSim Machine-Learning mesh deformation experiment"
+    )
+    parser.add_argument(
+        "--experiment", "-e",
+        required=True,
+        help="Name of the SmartSim experiment (e.g., mesh_deformation)"
+    )
+    parser.add_argument(
+        "--case", "-c",
+        required=True,
+        help="Name of the OpenFOAM case folder (e.g., ellipsoid3D)"
+    )
+    parser.add_argument(
+        "--radius_power",
+        default=0,
+        help="Power law associated with the loss function"
+    )
+    parser.add_argument(
+        "--platform",
+        choices=["slurm", "hotlum"],
+        default="local",
+        help="The platform on which this is being run"
+    )
+    args = parser.parse_args()
+    main(args)

From a07cea6eb442bafdda48d999880803c757545073 Mon Sep 17 00:00:00 2001
From: Andrew Shao <Andrew.Shao@hpe.com>
Date: Tue, 7 Oct 2025 13:16:52 -0500
Subject: [PATCH 2/3] Only post boundary points on initialization

Modify the solve routine and add a new method, called during the
meshMotion constructor, so that the boundary points are only posted
once.
---
 .../displacementSmartSimMotionSolver.C        | 228 ++++++++++--------
 .../displacementSmartSimMotionSolver.H        |  31 +--
 2 files changed, 150 insertions(+), 109 deletions(-)

diff --git a/src/fvMotionSolvers/displacementSmartSimMotionSolver/displacementSmartSimMotionSolver.C b/src/fvMotionSolvers/displacementSmartSimMotionSolver/displacementSmartSimMotionSolver.C
index 7714640..5fc0758 100644
--- a/src/fvMotionSolvers/displacementSmartSimMotionSolver/displacementSmartSimMotionSolver.C
+++ b/src/fvMotionSolvers/displacementSmartSimMotionSolver/displacementSmartSimMotionSolver.C
@@ -5,7 +5,7 @@
     \\  /    A nd           | www.openfoam.com
      \\/     M anipulation  |
 -------------------------------------------------------------------------------
-    Copyright (C) 2023 Tomislav Maric, TU Darmstadt 
+    Copyright (C) 2023 Tomislav Maric, TU Darmstadt
 -------------------------------------------------------------------------------
 License
     This file is part of OpenFOAM.
@@ -56,12 +56,12 @@ namespace Foam
     );
 }
 
-Foam::labelList Foam::displacementSmartSimMotionSolver::filterValidCmpts(const Vector<label>& dims) 
+Foam::labelList Foam::displacementSmartSimMotionSolver::filterValidCmpts(const Vector<label>& dims)
 {
-    labelList valid; 
+    labelList valid;
 
-    forAll(dims, dI) 
-        if (dims[dI] == 1)  // Active solution dimension in OpenFOAM 
+    forAll(dims, dI)
+        if (dims[dI] == 1)  // Active solution dimension in OpenFOAM
             valid.push_back(dI); // Valid dimension 0 (x), 1 (y), or 2 (z)
 
     return valid;
@@ -69,27 +69,27 @@ Foam::labelList Foam::displacementSmartSimMotionSolver::filterValidCmpts(const V
 
 // * * * * * * * * * * * * * Private Member Functions * * * * * * * * * * * * * * //
 
-void Foam::displacementSmartSimMotionSolver::writeSolutionDimToDatabase() 
+void Foam::displacementSmartSimMotionSolver::writeSolutionDimToDatabase()
 {
     client_.put_tensor("solution_dim",
-                        &solutionDim_, 
+                        &solutionDim_,
                         {1},
-                        SRTensorTypeInt32, 
+                        SRTensorTypeInt32,
                         SRMemLayoutContiguous);
 }
 
-void Foam::displacementSmartSimMotionSolver::writeMeshPointsToDatabase() 
+void Foam::displacementSmartSimMotionSolver::writeMeshPointsToDatabase()
 {
     const auto& meshPoints = points0(); //fvMesh_.points();
 
     if (solutionDim_ == 3) // 3D case
     {
         // Send existing 3D mesh points for forward inference: nPoints,
-        // dim=3. Saves time and memory in avoiding to create a 2D point buffer. 
+        // dim=3. Saves time and memory in avoiding to create a 2D point buffer.
         client_.put_tensor(rankMeshPointsName_,
-                           meshPoints.cdata(), 
+                           meshPoints.cdata(),
                            {size_t(meshPoints.size()), 3},
-                           SRTensorTypeDouble, 
+                           SRTensorTypeDouble,
                            SRMemLayoutContiguous);
     }
     else if (solutionDim_ == 2) // OpenFOAM pseudo 2D case
@@ -105,14 +105,81 @@ void Foam::displacementSmartSimMotionSolver::writeMeshPointsToDatabase()
             // 3D meshPoint data.
             points2D[2*pointI] = meshPoints[pointI][validCmpts_[0]];
             points2D[2*pointI + 1] = meshPoints[pointI][validCmpts_[1]];
-        } 
+        }
 
         // Send points2D to SmartRedis
         client_.put_tensor(
             rankMeshPointsName_,
-            points2D.data(), 
+            points2D.data(),
             {size_t(meshPoints.size()), size_t(solutionDim_)},
-            SRTensorTypeDouble, 
+            SRTensorTypeDouble,
+            SRMemLayoutContiguous
+        );
+    }
+}
+
+void Foam::displacementSmartSimMotionSolver::writeBoundaryPointsToDatabase()
+{
+    const pointField& points0 = this->points0();
+    List<point> mpiRankPoints;
+    const auto& meshBoundary = motionSolver::mesh().boundaryMesh();
+    const auto& boundaryDisplacements = pointDisplacement().boundaryField();
+    // Aggregate all points on the boundaries
+    forAll(boundaryDisplacements, patchI)
+    {
+        if (meshBoundary[patchI].type() == "empty"
+           || meshBoundary[patchI].type() == "processor")
+        {
+           continue;
+        }
+
+        const polyPatch& patch   = meshBoundary[patchI];
+        const labelList& patchPointIds = patch.meshPoints();
+
+        forAll(patchPointIds, id)
+        {
+            mpiRankPoints.append(points0[patchPointIds[id]]);
+        }
+    }
+
+    List<List<point>>   globalPointListList(Pstream::nProcs());
+    globalPointListList[Pstream::myProcNo()] = mpiRankPoints;
+    Pstream::gatherList(globalPointListList);
+
+    // - Send data to SmartRedis for ML model training from the main rank (0)
+    if (Pstream::myProcNo() == 0)
+    {
+        // - Compute the global number of boundary points and displacements.
+        label nGlobalBoundaryPoints = 0;
+        forAll(globalPointListList, rankI)
+        {
+            nGlobalBoundaryPoints += globalPointListList[rankI].size();
+        }
+        // - Resize agglomerated point and displacement data to equal size.
+        boundaryPoints_.resize(nGlobalBoundaryPoints * solutionDim_);
+
+        // - Agglomerate the gathered boundary List<List<vector>> points and
+        // displacements into boundaryPoints_ and boundaryDisplacements_ attributes.
+        label globalCmptI = 0;
+        forAll(globalPointListList, rankI)
+        {
+            // Get the list of points from each rank
+            const List<point>& rankPoints = globalPointListList[rankI];
+            forAll(rankPoints, pointI)
+            {
+                forAll(validCmpts_, dimI)
+                {
+                    boundaryPoints_[globalCmptI] = rankPoints[pointI][validCmpts_[dimI]];
+                    ++globalCmptI;
+                }
+            }
+        }
+        // Send points to SmartRedis for ML model training.
+        client_.put_tensor(
+            "points",
+            boundaryPoints_.data(),
+            {size_t(nGlobalBoundaryPoints), size_t(solutionDim_)},
+            SRTensorTypeDouble,
             SRMemLayoutContiguous
         );
     }
@@ -128,23 +195,24 @@ Foam::displacementSmartSimMotionSolver::displacementSmartSimMotionSolver
 :
     displacementMotionSolver(mesh, dict, typeName),
     fvMotionSolver(mesh),
-    clusterMode_(this->coeffDict().get<bool>("clusterMode")), 
-    client_(clusterMode_), 
+    clusterMode_(this->coeffDict().get<bool>("clusterMode")),
+    client_(clusterMode_),
     solutionDim_(
-        std::accumulate( 
-            fvMesh_.solutionD().cbegin(),   
-            fvMesh_.solutionD().cend(),     
-            0                               
+        std::accumulate(
+            fvMesh_.solutionD().cbegin(),
+            fvMesh_.solutionD().cend(),
+            0
         )
     ),
     validCmpts_(filterValidCmpts(fvMesh_.solutionD())),
     rankMeshPointsName_("points_MPI_" + std::to_string(Pstream::myProcNo())),
     rankMeshDisplacementsName_("displacements_MPI_" + std::to_string(Pstream::myProcNo())),
-    boundaryPoints_(), 
+    boundaryPoints_(),
     boundaryDisplacements_()
 {
     writeSolutionDimToDatabase();
     writeMeshPointsToDatabase();
+    writeBoundaryPointsToDatabase();
 }
 
 Foam::displacementSmartSimMotionSolver::
@@ -161,20 +229,21 @@ displacementSmartSimMotionSolver
     clusterMode_(dict.getOrDefault<bool>("clusterMode", true)),
     client_(clusterMode_),
     solutionDim_(
-        std::accumulate( 
-            fvMesh_.solutionD().cbegin(),   
-            fvMesh_.solutionD().cend(),     
-            0                               
+        std::accumulate(
+            fvMesh_.solutionD().cbegin(),
+            fvMesh_.solutionD().cend(),
+            0
         )
     ),
     validCmpts_(filterValidCmpts(fvMesh_.solutionD())),
     rankMeshPointsName_("points_MPI_" + std::to_string(Pstream::myProcNo())),
     rankMeshDisplacementsName_("displacements_MPI_" + std::to_string(Pstream::myProcNo())),
-    boundaryPoints_(), 
+    boundaryPoints_(),
     boundaryDisplacements_()
 {
     writeSolutionDimToDatabase();
     writeMeshPointsToDatabase();
+    writeBoundaryPointsToDatabase();
 }
 
 // * * * * * * * * * * * * * * * * Destructor  * * * * * * * * * * * * * * * //
@@ -196,20 +265,13 @@ Foam::tmp<Foam::pointField> Foam::displacementSmartSimMotionSolver::curPoints()
     return tcurPoints;
 }
 
-void Foam::displacementSmartSimMotionSolver::solve() 
+void Foam::displacementSmartSimMotionSolver::solve()
 {
     // The points have moved so before interpolation update
     pointDisplacement_.boundaryFieldRef().evaluate();
 
-    // Assemble and send boundary points and their displacements to SmartRedis 
-
-    // - Agglomerate boundary points and displacements for the MPI rank
-
-    // TODO(TM,AS): move the points0 agglomeration and writing to writeMeshPointsToDatabase  
-    const pointField& points0 = this->points0(); // MOVE
+    const auto& meshBoundary = motionSolver::mesh().boundaryMesh();
     const auto& boundaryDisplacements = pointDisplacement().boundaryField();
-    const auto& meshBoundary = motionSolver::mesh().boundaryMesh(); 
-    List<point> mpiRankPoints; // MOVE 
     List<vector> mpiRankDisplacements;
     forAll(boundaryDisplacements, patchI)
     {
@@ -218,97 +280,75 @@ void Foam::displacementSmartSimMotionSolver::solve()
         {
            continue;
         }
-
         tmp<vectorField> dispPtr = boundaryDisplacements[patchI].patchInternalField();
         const vectorField& disp  = dispPtr();
 
-        const polyPatch& patch   = meshBoundary[patchI]; // MOVE
-        const labelList& patchPointIds = patch.meshPoints();  // MOVE
-
-        forAll(patchPointIds, id)
+        forAll(disp, id)
         {
-            mpiRankPoints.append(points0[patchPointIds[id]]); // MOVE
-            mpiRankDisplacements.append(disp[id]);
+            if (disp[id].size() > 0) mpiRankDisplacements.append(disp[id]);
         }
     }
 
     // - Prepare global displacement and point lists for gather
-    List<List<point>>   globalPointListList(Pstream::nProcs()); // MOVE
     List<List<vector>>  globalDisplacementListList(Pstream::nProcs());
 
-    // - Assign data in the lobal lists list from this MPI rank
-    globalPointListList[Pstream::myProcNo()] = mpiRankPoints; // MOVE
+    // - Assign data in the global lists list from this MPI rank
     globalDisplacementListList[Pstream::myProcNo()] = mpiRankDisplacements;
 
     // - Gather all data from all ranks at the main rank (0)
-    Pstream::gatherList(globalPointListList); // MOVE
     Pstream::gatherList(globalDisplacementListList);
 
     // - Send data to SmartRedis for ML model training from the main rank (0)
-    if (Pstream::myProcNo() == 0) 
+    if (Pstream::myProcNo() == 0)
     {
-        // - Compute the global number of boundary points and displacements. 
-        label nGlobalBoundaryPoints = 0;  // MOVE
-        forAll(globalPointListList, rankI) // MOVE
+        // - Compute the global number of boundary points and displacements.
+
+        label nGlobalBoundaryDisplacements= 0;
+        forAll(globalDisplacementListList, rankI)
         {
-            nGlobalBoundaryPoints += globalPointListList[rankI].size(); // MOVE
+            nGlobalBoundaryDisplacements += globalDisplacementListList[rankI].size();
         }
-        
-        // - Resize agglomerated point and displacement data to equal size. 
-        boundaryPoints_.resize(nGlobalBoundaryPoints * solutionDim_); // MOVE
-        boundaryDisplacements_.resize(nGlobalBoundaryPoints * solutionDim_);
+        boundaryDisplacements_.resize(nGlobalBoundaryDisplacements * solutionDim_);
 
         // - Agglomerate the gathered boundary List<List<vector>> points and
-        // displacements into boundaryPoints_ and boundaryDisplacements_ attributes. 
+        // displacements into boundaryPoints_ and boundaryDisplacements_ attributes.
         label globalCmptI = 0;
-        forAll(globalPointListList, rankI)
+        forAll(globalDisplacementListList, rankI)
         {
-            // Get the list of points from each rank 
-            const List<point>& rankPoints = globalPointListList[rankI]; // MOVE
-            // Get the list of displacements from each rank 
+            // Get the list of displacements from each rank
             const List<point>& rankDisplacements = globalDisplacementListList[rankI];
 
             // Assign rank points and rank displacements to boundaryPoints_ and
-            // boundaryDisplacements_. 
+            // boundaryDisplacements_.
             // meshPoints [1,2,3],[4,5,6]
             // validCmpts [0,2] - xz axis is the solution plane.
-            // globalPoints_ = [1,3,4,6] - viewed as [1,3], [4,6].   
+            // globalPoints_ = [1,3,4,6] - viewed as [1,3], [4,6].
 
             // Iteration step is therefore point * solution dimension for
             // globalPoints_  and globalDisplacements_
-            forAll(rankPoints, pointI)
+            forAll(rankDisplacements, pointI)
             {
                 forAll(validCmpts_, dimI)
                 {
-                    boundaryPoints_[globalCmptI] = rankPoints[pointI][validCmpts_[dimI]]; // MOVE
                     boundaryDisplacements_[globalCmptI] = rankDisplacements[pointI][validCmpts_[dimI]];
                     ++globalCmptI;
                 }
             }
         }
 
-        // Send points to SmartRedis for ML model training.
-        client_.put_tensor( // MOVE
-            "points",
-            boundaryPoints_.data(), 
-            {size_t(nGlobalBoundaryPoints), size_t(solutionDim_)},
-            SRTensorTypeDouble, 
-            SRMemLayoutContiguous
-        );
-
         client_.put_tensor(
             "displacements",
-            boundaryDisplacements_.data(), 
-            {size_t(nGlobalBoundaryPoints), size_t(solutionDim_)},
-            SRTensorTypeDouble, 
+            boundaryDisplacements_.data(),
+            {size_t(nGlobalBoundaryDisplacements), size_t(solutionDim_)},
+            SRTensorTypeDouble,
             SRMemLayoutContiguous
         );
 
         client_.put_tensor(
-            "data_ready", 
-            &solutionDim_, 
+            "data_ready",
+            &solutionDim_,
             {1},
-            SRTensorTypeInt32, 
+            SRTensorTypeInt32,
             SRMemLayoutContiguous
         );
     }
@@ -316,19 +356,19 @@ void Foam::displacementSmartSimMotionSolver::solve()
     // Refresh points_MPI_<rank> with current mesh points.
     // writeMeshPointsToDatabase();  // TODO(TM): can we remove this using points0 displacements?
 
-    bool model_ready = client_.poll_key("model_ready", 1, 10000);
+    bool model_ready = client_.poll_key("model_ready", 1, 100000);
     if (! model_ready)
     {
         FatalErrorInFunction
             << "Displacement model not available in the SmartRedis database."
             << exit(Foam::FatalError);
     }
-    else // Perform forward inference in the database and assign rank-displacements 
+    else // Perform forward inference in the database and assign rank-displacements
     {
         // Perform the forward inference in SmartRedis
         client_.run_model(
-            "model", 
-            {rankMeshPointsName_}, 
+            "model",
+            {rankMeshPointsName_},
             {rankMeshDisplacementsName_}
         );
 
@@ -346,7 +386,7 @@ void Foam::displacementSmartSimMotionSolver::solve()
             {rankMeshDisplacements.size()},
             SRTensorTypeDouble,
             SRMemLayoutContiguous
-        );   
+        );
 
         label globalId = 0;
         pointVectorField newDisplacement("newDisplacement", pointDisplacement_);
@@ -358,24 +398,24 @@ void Foam::displacementSmartSimMotionSolver::solve()
                 ++globalId;
             }
         }
-        //newDisplacement.boundaryFieldRef().evaluate(); 
-        pointDisplacement_.internalFieldRef() = newDisplacement.internalField(); 
-        pointDisplacement_.boundaryFieldRef().evaluate(); 
+        //newDisplacement.boundaryFieldRef().evaluate();
+        pointDisplacement_.internalFieldRef() = newDisplacement.internalField();
+        pointDisplacement_.boundaryFieldRef().evaluate();
     }
 
-    // At the end of the simulation, have MPI rank 0 notify the python 
+    // At the end of the simulation, have MPI rank 0 notify the python
     // client via SmartRedis that the simulation has completed by writing
-    // an end_time_index tensor to SmartRedis. 
+    // an end_time_index tensor to SmartRedis.
     const auto& runTime = fvMesh_.time();
-    if ((Pstream::myProcNo() == 0) &&  
+    if ((Pstream::myProcNo() == 0) &&
         (runTime.timeOutputValue() >= runTime.endTime().value()))
     {
         std::vector<double> end_time_vec {double(runTime.timeIndex())};
         Info << "Seting end time flag : " << end_time_vec[0] << endl;
         client_.put_tensor(
-            "final_iteration", 
-            end_time_vec.data(), 
-            {1}, 
+            "final_iteration",
+            end_time_vec.data(),
+            {1},
             SRTensorTypeDouble, SRMemLayoutContiguous
         );
     }
diff --git a/src/fvMotionSolvers/displacementSmartSimMotionSolver/displacementSmartSimMotionSolver.H b/src/fvMotionSolvers/displacementSmartSimMotionSolver/displacementSmartSimMotionSolver.H
index b23ba8f..158adc9 100644
--- a/src/fvMotionSolvers/displacementSmartSimMotionSolver/displacementSmartSimMotionSolver.H
+++ b/src/fvMotionSolvers/displacementSmartSimMotionSolver/displacementSmartSimMotionSolver.H
@@ -5,7 +5,7 @@
     \\  /    A nd           | www.openfoam.com
      \\/     M anipulation  |
 -------------------------------------------------------------------------------
-    Copyright (C) 2023 Tomislav Maric, TU Darmstadt 
+    Copyright (C) 2023 Tomislav Maric, TU Darmstadt
 -------------------------------------------------------------------------------
 License
     This file is part of OpenFOAM.
@@ -32,7 +32,7 @@ Group
 Description
 
     Mesh motion solver for an fvMesh. Globally approximates mesh displacement
-    using Machine Learning Models. Coupling with ML is done using SmartSim. 
+    using Machine Learning Models. Coupling with ML is done using SmartSim.
 
 SourceFiles
     displacementSmartSimMotionSolver.C
@@ -66,28 +66,28 @@ class displacementSmartSimMotionSolver
 
         ////- Interpolation used to transfer cell displacement to the points
         //autoPtr<motionInterpolation> interpolationPtr_;
-    
-        //- Set to false if not using a clustered database 
+
+        //- Set to false if not using a clustered database
         bool clusterMode_;
 
         //- SmartRedis Database Client
         SmartRedis::Client client_;
-        
+
         //- Spatial dimension - necessary for CFD+ML dimension consistency.
-        //- OpenFOAM ignores simply components in pseudo 2D cases; NNs cannot 
+        //- OpenFOAM ignores simply components in pseudo 2D cases; NNs cannot
         //  be trained on components whose values are all constant (zeros).
-        const label solutionDim_; 
+        const label solutionDim_;
 
         // - Which vector components correspond to solution dimensions:
         //   fvMesh::solutionD() = [1, 0, 1] -> solutionComponents_ = [0, 2]
-        const labelList validCmpts_; 
+        const labelList validCmpts_;
 
-        // - SmartRedis tensor names for ML inference for each MPI rank. 
+        // - SmartRedis tensor names for ML inference for each MPI rank.
         const word rankMeshPointsName_;
         const word rankMeshDisplacementsName_;
-        
-        // - Flattened boundary points sent to SmartRedis for ML 
-        std::vector<double> boundaryPoints_; 
+
+        // - Flattened boundary points sent to SmartRedis for ML
+        std::vector<double> boundaryPoints_;
 
         // - Flattened boundary displacements sent to SmartRedis for ML
         std::vector<double> boundaryDisplacements_;
@@ -103,8 +103,9 @@ class displacementSmartSimMotionSolver
 
         static labelList filterValidCmpts(const Vector<label>& solutionDim);
 
-        void writeSolutionDimToDatabase(); 
-        void writeMeshPointsToDatabase(); 
+        void writeSolutionDimToDatabase();
+        void writeMeshPointsToDatabase();
+        void writeBoundaryPointsToDatabase();
 
 public:
 
@@ -140,7 +141,7 @@ public:
     virtual tmp<pointField> curPoints() const;
 
     //- Solve for motion
-    virtual void solve(); 
+    virtual void solve();
 
 };
 

From 92953a73e0fa1b08c29085bf58a2385d68705b41 Mon Sep 17 00:00:00 2001
From: Andrew Shao <andrew.shao@hpe.com>
Date: Wed, 8 Oct 2025 00:10:29 +0000
Subject: [PATCH 3/3] Continue to modularize trainer

Break the definition and particulars of model training out of the
training script into their own files. To include a new model,
users should add another file to the networks directory and create
two new classes: the model class, which defines the architecture,
and the trainer class, which controls how the model is trained.
---
 run/meshMotion/.gitignore           |   1 +
 run/meshMotion/ml_model_training.py | 100 ++++++++--------------------
 run/meshMotion/networks/MLP.py      |  56 ++++++++++++++++
 run/meshMotion/requirements.txt     |   2 +
 run/meshMotion/smartsim_driver.py   |   8 ++-
 5 files changed, 92 insertions(+), 75 deletions(-)
 create mode 100644 run/meshMotion/networks/MLP.py
 create mode 100644 run/meshMotion/requirements.txt

diff --git a/run/meshMotion/.gitignore b/run/meshMotion/.gitignore
index a8c86b9..bc09812 100644
--- a/run/meshMotion/.gitignore
+++ b/run/meshMotion/.gitignore
@@ -2,3 +2,4 @@
 *.stl 
 *.csv
 *.pdf
+ellipsoid3D_MachineLearningMeshMotion/*
diff --git a/run/meshMotion/ml_model_training.py b/run/meshMotion/ml_model_training.py
index 12b3643..9dfc346 100644
--- a/run/meshMotion/ml_model_training.py
+++ b/run/meshMotion/ml_model_training.py
@@ -1,40 +1,13 @@
 import argparse
-from smartredis import Client
 import torch
-import torch.nn as nn
 import numpy as np
 import io
-from sklearn.model_selection import train_test_split
 import torch.optim as optim
-import time
-from typing import Tuple, Union
-from matplotlib import pyplot as plt
-
-from sklearn.metrics import mean_squared_error
-
-class MLP(nn.Module):
-    def __init__(self, num_layers, layer_width, input_size, output_size, activation_fn):
-        super(MLP, self).__init__()
-
-        layers = []
-        layers.append(nn.Linear(input_size, layer_width))
-        layers.append(activation_fn)
-
-        for _ in range(num_layers - 2):
-            layers.append(nn.Linear(layer_width, layer_width))
-            layers.append(activation_fn)
 
-        layers.append(nn.Linear(layer_width, output_size))
-        self.layers = nn.Sequential(*layers)
-
-    def forward(self, x):
-        return self.layers(x)
-
-def loss_weighted_center(y_true, y_pred, weights, weights_power):
-    weights_normed = torch.pow(weights, weights_power)
-    weights_normed = weights_normed/torch.sum(weights_normed)
+from matplotlib import pyplot as plt
+from smartredis import Client
 
-    return torch.sum(torch.sum((y_true-y_pred)**2, dim=1)*weights_normed)
+from MLP import MLP, MLPTrainer
 
 
 def train(args):
@@ -42,24 +15,27 @@ def train(args):
     torch.set_default_dtype(torch.float64)
 
     # Read the solution direction from a database
-    dimension = int(client.get_tensor("solution_dim"))
+    dimension = int(client.get_tensor("solution_dim")[0])
 
     print (f"Solution dimension = {dimension}.")
-
     # Initialize the model
-    model = MLP(
-        num_layers=3,
-        layer_width=10,
-        input_size=dimension,
-        output_size=dimension,
-        activation_fn=torch.nn.ELU()
-    )
-
-    # Initialize the optimizer
-    learning_rate = 1e-3
-    optimizer = optim.Adam(model.parameters(), lr=learning_rate)
+    if args.model_name == "mlp":
+        model = MLP(
+            input_size=dimension,
+            output_size=dimension,
+            num_layers=3,
+            layer_width=10,
+            activation_fn=torch.nn.ELU()
+        )
+        trainer = MLPTrainer(model, args.radius_power)
 
+    data_ready = client.poll_key("points", 1, 10000)
+    points = client.get_tensor("points")
+    interior_points = np.vstack([client.get_tensor(f"points_MPI_{i}") for i in range(args.mpi_ranks)])
+    X = torch.from_numpy(points).to(torch.float64)
     # Make sure all datasets are avaialble in the smartredis database.
+
+    epochs = 5000
     iteration = 1
     while True:
 
@@ -69,47 +45,22 @@ def train(args):
         if (not data_ready):
             raise RuntimeError("Data not found in SmartRedis; aborting training.")
 
-        points = client.get_tensor("points")
         displacements = client.get_tensor("displacements")
-
+        interior_points = client.get_tensor
         client.delete_tensor("data_ready")
 
-        X = torch.from_numpy(points).to(torch.float64)
         y = torch.from_numpy(displacements).to(torch.float64)
 
-        # Find the center of the shape as the average of all the points on the inner boundary
-        r = torch.sqrt(torch.sum(X**2, dim=1))
-        inner = r < 5
-        center = torch.mean(X[inner], dim=0)
-
-        dist = torch.sqrt(torch.sum((X-center)**2, dim=1))
-        wts = dist/torch.sum(dist)
 
         validation_rmse = []
-        model.train()
-        epochs = 5000
         n_epochs = 0
 
         for epoch in range(epochs):
-            # Zero the gradients
-            optimizer.zero_grad()
-
-            # Forward pass on the training data
-            displ_pred = model(X)
-
-            # Compute loss on the training data
-            loss_train = loss_weighted_center(displ_pred, y, wts, args.radius_power)
-
-            if (loss_train < 5e-05):
+            loss, model = trainer.training_step(X, y)
+            if trainer.converged():
                 break
 
-            # Backward pass and optimization
-            loss_train.backward()
-            optimizer.step()
-
-            n_epochs = n_epochs + 1
-
-        print (f"MSE {loss_train.item()}, number of epochs {n_epochs}", flush=True)
+        print(f"MSE {loss.item()}, number of epochs {epoch}", flush=True)
         np.savez(
             f"data_{iteration:02d}.npz",
             points=points,
@@ -150,6 +101,11 @@ def train(args):
     parser = argparse.ArgumentParser(description="Training script for mesh motion")
     parser.add_argument("mpi_ranks", help="number of mpi ranks", type=int)
     parser.add_argument("radius_power", help="power law to weight losses", type=float)
+    parser.add_argument("model_name",
+                        help="which model to use to calculate interior displacements",
+                        choices=["mlp"],
+                        type=str
+    )
     args = parser.parse_args()
 
     train(args)
diff --git a/run/meshMotion/networks/MLP.py b/run/meshMotion/networks/MLP.py
new file mode 100644
index 0000000..4b72270
--- /dev/null
+++ b/run/meshMotion/networks/MLP.py
@@ -0,0 +1,88 @@
+"""Multilayer perceptron and its trainer for predicting mesh displacements."""
+import torch
+import torch.nn as nn
+import torch.optim as optim
+
+
+class MLP(nn.Module):
+    """Stack of linear layers with an activation after every layer but the last."""
+
+    def __init__(self, input_size, output_size, activation_fn, num_layers, layer_width):
+        """Build the network.
+
+        Args:
+            input_size: Number of features in each input sample.
+            output_size: Number of features in each output sample.
+            activation_fn: Activation module applied after every linear layer
+                except the last; the same instance is reused throughout.
+            num_layers: Total number of linear layers; the input and output
+                layers are always created, so values below 2 behave like 2.
+            layer_width: Number of units in each hidden layer.
+        """
+        super().__init__()
+
+        layers = [nn.Linear(input_size, layer_width), activation_fn]
+        for _ in range(num_layers - 2):
+            layers += [nn.Linear(layer_width, layer_width), activation_fn]
+        layers.append(nn.Linear(layer_width, output_size))
+        self.layers = nn.Sequential(*layers)
+
+    def forward(self, x):
+        """Return the network output for the batch ``x``."""
+        return self.layers(x)
+
+
+class MLPTrainer:
+    """Owns the optimizer and the distance-weighted loss used to fit an ``MLP``."""
+
+    def __init__(self, model, radius_power, lr=1e-3, loss_stop=5e-5):
+        """Set up training.
+
+        Args:
+            model: Network to optimize.
+            radius_power: Exponent applied to each point's distance from the
+                center when weighting its contribution to the loss.
+            lr: Learning rate passed to Adam.
+            loss_stop: Loss value below which training counts as converged.
+        """
+        self.model = model
+        self.optimizer = optim.Adam(model.parameters(), lr=lr)
+        self.loss_stop = loss_stop
+        self.loss_value = None
+        self.radius_power = radius_power
+
+    def _point_weights(self, X, y_true):
+        """Return normalized per-point weights, distance-from-center ** radius_power."""
+        # A point counts as displaced when ANY component moved. Reducing over
+        # the component axis keeps the mask one entry per point, so the mean
+        # below is a per-axis centroid rather than a single scalar.
+        displaced = torch.any(y_true != 0., dim=1)
+        # With no displaced points the mean would be NaN and poison the
+        # optimizer state; fall back to the centroid of all points.
+        anchor = X[displaced] if bool(displaced.any()) else X
+        center = torch.mean(anchor, dim=0)
+        scaled_dist = torch.sqrt(torch.sum((X - center)**2, dim=1))**self.radius_power
+        return scaled_dist / torch.sum(scaled_dist)
+
+    def loss(self, X, y_true):
+        """Return the weighted sum over points of the absolute prediction error."""
+        wts = self._point_weights(X, y_true)
+        y_pred = self.model(X)
+        # abs() equals sqrt(x**2) but has a finite gradient at zero residual.
+        return torch.sum(wts * torch.sum(torch.abs(y_true - y_pred), dim=1))
+
+    def training_step(self, X, y_true):
+        """Run one optimizer update and return ``(loss, model)``."""
+        self.optimizer.zero_grad()
+        loss_value = self.loss(X, y_true)
+        self.loss_value = loss_value
+        loss_value.backward()
+        self.optimizer.step()
+
+        return loss_value, self.model
+
+    def converged(self):
+        """Return True once the latest recorded loss is below ``loss_stop``."""
+        if self.loss_value is None:
+            return False
+        return self.loss_value.item() < self.loss_stop
diff --git a/run/meshMotion/requirements.txt b/run/meshMotion/requirements.txt
new file mode 100644
index 0000000..8ea9fb0
--- /dev/null
+++ b/run/meshMotion/requirements.txt
@@ -0,0 +1,2 @@
+gmsh
+PyFoam
diff --git a/run/meshMotion/smartsim_driver.py b/run/meshMotion/smartsim_driver.py
index e612e08..bc61602 100644
--- a/run/meshMotion/smartsim_driver.py
+++ b/run/meshMotion/smartsim_driver.py
@@ -57,10 +57,10 @@ def main(args):
     openfoam_rs = exp.create_run_settings(
         exe="moveDynamicMesh",
         exe_args="-parallel",
+        run_command="mpirun"
     )
     openfoam_rs.set_tasks(num_mpi_ranks)
     openfoam_rs.set_nodes(1)
-    openfoam_rs.set("exclusive")
 
     # Create the model from the OpenFOAM case argument
     openfoam_model = exp.create_model(
@@ -75,7 +75,7 @@ def main(args):
 
     training_rs = exp.create_run_settings(
         exe="python",
-        exe_args=f"ml_model_training.py {num_mpi_ranks} {args.radius_power}"
+        exe_args=f"ml_model_training.py {num_mpi_ranks} {args.radius_power} mlp"
     )
     training_rs.set_tasks(1)
     training_rs.set_nodes(1)
@@ -84,7 +84,9 @@ def main(args):
         name="ml_model_training",
         run_settings=training_rs
     )
-    ml_model_training.attach_generator_files(to_copy="ml_model_training.py")
+    ml_model_training.attach_generator_files(
+        to_copy=["ml_model_training.py", "networks/MLP.py"]
+    )
 
     exp.generate(ml_model_training, overwrite=True)