16 changes: 8 additions & 8 deletions toolchain/modules
@@ -83,11 +83,11 @@ san-all cmake python
san-gpu nvhpc cuda cray-mpich

h hipergator
-h-gpu nvhpc/25.9
-h-gpu CUDA_HOME="/apps/compilers/cuda/12.8.1"
-h-all HPC_OMPI_DIR="/apps/mpi/cuda/12.8.1/nvhpc/25.3/openmpi/5.0.7"
-h-all HPC_OMPI_BIN="/apps/mpi/cuda/12.8.1/nvhpc/25.3/openmpi/5.0.7/bin"
-h-all OMPI_MCA_pml=ob1 OMPI_MCA_coll_hcoll_enable=0
-h-gpu PATH="/apps/mpi/cuda/12.8.1/nvhpc/25.3/openmpi/5.0.7/bin:${PATH}"
-h-all LD_LIBRARY_PATH=/apps/compilers/cuda/12.8.1/lib64:$LD_LIBRARY_PATH
-h-gpu MFC_CUDA_CC=100 NVHPC_CUDA_HOME="/apps/compilers/cuda/12.8.1"
+h-all python/3.12
+h-cpu gcc/14.2 openmpi/5.0.7
+h-gpu UCX_NET_DEVICES="mlx5_4:1,mlx5_7:1,mlx5_8:1,mlx5_9:1,mlx5_10:1,mlx5_13:1,mlx5_14:1,mlx5_15:1"
+h-gpu cuda/12.9.1 nvhpc/25.9 openmpi/5.0.7
+h-gpu CC=/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpicc
+h-gpu CXX=/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpicxx
+h-gpu FC=/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpifort
+h-gpu NVCOMPILER_COMM_LIBS_HOME=/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/12.9
Comment on lines +88 to +93
⚠️ Potential issue | 🟠 Major

🧩 Analysis chain

🏁 Script executed:

# First, locate the toolchain/modules file
fd --type f "modules" toolchain/

🏁 Script executed:

# Get the full context around lines 88-93 and see other cluster configurations
cat -n toolchain/modules | head -100

🏁 Script executed:

# Check how CC/CXX/FC are used in the build system
rg "(\$CC|\$CXX|\$FC|CC=|CXX=|FC=)" --type cmake -A 2 | head -50

🏁 Script executed:

# Check the HiperGator stanzas in toolchain/modules for how CC/CXX/FC are set
cat toolchain/modules | grep -A 10 -B 5 "hipergator\|h-gpu"

🏁 Script executed:

# Search for HiperGator-specific build configuration or comments
rg -i "hipergator|h-gpu|mpicc|mpifort" . -A 2 -B 2 --max-count 20

🏁 Script executed:

# Check if there are any cmake files that handle compiler selection
fd -e cmake | head -5

🏁 Script executed:

# Look at CMakeLists.txt to understand compiler handling
head -100 CMakeLists.txt


The HiperGator GPU configuration deviates from all other clusters by explicitly setting MPI wrapper paths instead of the base NVHPC compilers.

All other GPU clusters (Bridges2, Ascent, Wombat, Expanse, Phoenix, Delta, Oscar, Nautilus) use CC=nvc CXX=nvc++ FC=nvfortran, while HiperGator points these variables at explicit MPI wrapper paths. This is inconsistent and problematic:

  1. GPU compilation expectation: learning notes indicate GPU code should be compiled with nvfortran, not a wrapper.
  2. Build system assumptions: CMakeLists.txt sets the compiler via environment variables and detects the compiler ID; MPI wrapper paths may not be properly identified as NVHPC.
  3. Portability: MPI wrappers pinned to a specific installation path are less portable than wrapper commands resolved through PATH.

If MPI wrappers are necessary for HiperGator's build, consider using the wrapper commands (mpicc, mpicxx, mpifort) instead of hardcoded paths, aligning with the pattern used by other clusters.
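
A minimal sketch of the first option (base NVHPC compilers), assuming the remaining added h-gpu lines from the hunk above stay as they are; whether NVCOMPILER_COMM_LIBS_HOME should keep the path shown in the diff is a question for the PR author:

h-gpu cuda/12.9.1 nvhpc/25.9 openmpi/5.0.7
h-gpu CC=nvc CXX=nvc++ FC=nvfortran
h-gpu NVCOMPILER_COMM_LIBS_HOME=/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/12.9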

🤖 Prompt for AI Agents
In `@toolchain/modules` around lines 88-93, update the HiperGator GPU module env
vars so they match the other GPU clusters: replace the hardcoded MPI wrapper paths
in CC, CXX, and FC with either the NVHPC compiler commands (CC=nvc, CXX=nvc++,
FC=nvfortran) so the build uses the NVHPC compilers directly, or, if MPI wrappers
are required, the generic wrapper commands (mpicc, mpicxx, mpifort) instead of
absolute paths; also ensure NVCOMPILER_COMM_LIBS_HOME stays pointed at the correct
NVHPC comm_libs location so the MPI libraries are found by the toolchain.

⚠️ Potential issue | 🟠 Major

🧩 Analysis chain

🌐 Web query:

NVIDIA B200 GPU CUDA compute capability

💡 Result:

The NVIDIA B200 (Blackwell SM100) has CUDA compute capability 10.0 (target arches sm100a / sm100f); it requires CUDA toolkit support beginning with CUDA 12.8. [1][2]
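
If login access to a B200 node is available, the reported value can also be checked directly; this sketch assumes the node's nvidia-smi is recent enough to expose the compute_cap query field:

# Prints the compute capability for each visible GPU (expected: 10.0 on B200)
nvidia-smi --query-gpu=name,compute_cap --format=csv,noheader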


🏁 Script executed:

# Search for MFC_CUDA_CC in the toolchain/modules file
grep -n "MFC_CUDA_CC" toolchain/modules | head -20

Add MFC_CUDA_CC=100 for B200 GPU compute capability targeting.

All other GPU-enabled clusters specify MFC_CUDA_CC to target specific GPU architectures (e.g., Phoenix on line 41: MFC_CUDA_CC=70,75,80,89,90; Delta on line 53: MFC_CUDA_CC=80,86). The B200 GPU has CUDA compute capability 10.0 (SM100 architecture) and requires CUDA 12.8 or later, so the h-gpu configuration should include MFC_CUDA_CC=100 for consistent GPU targeting.
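
For reference, the deleted h-gpu line in the hunk above already carried MFC_CUDA_CC=100, so restoring it is a one-line addition in the same format as the existing h-gpu entries (shown here on its own line; it could equally be appended to one of the existing h-gpu lines):

h-gpu MFC_CUDA_CC=100

On the nvcc side, compute capability 10.0 corresponds to the sm_100 target that, per the web query result above, became available with CUDA 12.8.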

🤖 Prompt for AI Agents
In `@toolchain/modules` around lines 88-93, add the environment variable
MFC_CUDA_CC=100 to the h-gpu stanza so the configuration targets SM100 (CUDA
compute capability 10.0); update the block that defines h-gpu (the lines setting
UCX_NET_DEVICES, cuda/12.9.1, nvhpc/25.9, openmpi/5.0.7 and the
CC/CXX/FC/NVCOMPILER_COMM_LIBS_HOME vars) to include MFC_CUDA_CC=100 alongside
those existing environment definitions.

5 changes: 3 additions & 2 deletions toolchain/templates/hipergator.mako
@@ -8,10 +8,11 @@
#SBATCH --job-name="${name}"
#SBATCH --output="${name}.out"
#SBATCH --time=${walltime}
-#SBATCH --cpus-per-task=7
% if gpu_enabled:
Copilot AI Jan 15, 2026

The cpus-per-task setting is now only applied to GPU jobs (inside the % if gpu_enabled: block), but CPU jobs have no cpus-per-task specification. This asymmetry could lead to suboptimal CPU-only job configurations. Consider whether CPU jobs should also have an explicit cpus-per-task setting, or document why GPU jobs specifically need 3 CPUs per task while CPU jobs use the default.

Suggested change
-% if gpu_enabled:
+% if gpu_enabled:
+# Note: For GPU jobs, we explicitly request 1 GPU and 3 CPUs per task.
+# CPU-only jobs rely on the cluster's default cpus-per-task setting.

#SBATCH --gpus-per-task=1
+#SBATCH --cpus-per-task=3
#SBATCH --gpu-bind=closest
+#SBATCH --mem-per-cpu=50GB
Copilot AI Jan 15, 2026

50GB memory per CPU is extremely high (150GB total for 3 CPUs per task). This could severely limit job scheduling on the cluster. Verify this is the intended memory requirement and not a typo (perhaps 50GB total or 5GB per CPU was intended). Most GPU codes require much less CPU memory unless doing significant host-side preprocessing.

Suggested change
-#SBATCH --mem-per-cpu=50GB
+#SBATCH --mem-per-cpu=5GB
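
For context, a sketch of how the two readings mentioned above could be expressed as Slurm directives; the values are illustrative only, and --mem-per-gpu assumes the cluster schedules GPUs as consumable resources:

# Reading 1: about 5 GB per allocated CPU (15 GB for a task with 3 CPUs)
#SBATCH --mem-per-cpu=5GB
# Reading 2: about 50 GB for the whole task, expressed per GPU (1 GPU per task)
#SBATCH --mem-per-gpu=50GB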

% endif
Comment on lines 11 to 16

Suggestion: Add an else block to the gpu_enabled check to set --cpus-per-task=7 for CPU-only jobs, restoring the intended behavior. [general, importance: 8]

Suggested change
-% if gpu_enabled:
-#SBATCH --gpus-per-task=1
-#SBATCH --cpus-per-task=3
-#SBATCH --gpu-bind=closest
-#SBATCH --mem-per-cpu=50GB
-% endif
+% if gpu_enabled:
+#SBATCH --gpus-per-task=1
+#SBATCH --cpus-per-task=3
+#SBATCH --mem-per-cpu=50GB
+% else:
+#SBATCH --cpus-per-task=7
+% endif

% if account:
#SBATCH --account=${account}
@@ -48,7 +49,7 @@ echo
(set -x; ${profiler} "${target.get_install_binpath(case)}")
% else:
(set -x; ${profiler} \
-mpirun -np ${nodes*tasks_per_node} \
+/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpirun -np ${nodes*tasks_per_node} \
Copilot AI Jan 15, 2026

The hardcoded absolute path to mpirun creates a tight coupling to a specific NVHPC version (25.9) and installation location. This path is used unconditionally for both GPU and CPU modes, but the CPU configuration in toolchain/modules uses gcc/openmpi which would have a different mpirun path. Consider either: (1) using a conditional path based on gpu_enabled to use the appropriate MPI launcher for each mode, or (2) relying on the PATH environment variable set by the module system (like other cluster templates do) by simply using mpirun.

Suggested change
-/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpirun -np ${nodes*tasks_per_node} \
+mpirun -np ${nodes*tasks_per_node} \

P2: The hardcoded NVHPC mpirun is used even in CPU mode, mismatching the loaded OpenMPI stack and risking a missing binary or MPI runtime failures for CPU MPI jobs.

Prompt for AI agents
Check if this issue is valid — if so, understand the root cause and fix it. At toolchain/templates/hipergator.mako, line 52:

<comment>Hardcoded NVHPC mpirun is used even in CPU mode, mismatching the loaded OpenMPI stack and risking missing binary or MPI runtime failures for CPU MPI jobs.</comment>

<file context>
@@ -48,7 +49,7 @@ echo
     % else:
         (set -x; ${profiler}    \
-            mpirun -np ${nodes*tasks_per_node}            \
+            /apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpirun -np ${nodes*tasks_per_node}            \
                    --bind-to none                         \
                    "${target.get_install_binpath(case)}")
</file context>
Suggested change
-/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpirun -np ${nodes*tasks_per_node} \
+${'/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpirun' if gpu_enabled else 'mpirun'} -np ${nodes*tasks_per_node} \

--bind-to none \
"${target.get_install_binpath(case)}")
% endif
Comment on lines 50 to 55
Suggestion: The absolute MPI launcher path contains a duplicated version segment ("25.9" appears twice) which very likely makes the path incorrect and the mpirun binary unavailable at runtime; fix the path to the correct single-version location so the launcher exists on the nodes. [possible bug]

Severity Level: Critical 🚨
- ❌ MPI jobs fail to start on affected nodes.
- ⚠️ Distributed test runs do not execute.
- ⚠️ Affects template-driven MPI launches in CI and local runs.
Suggested change
% else:
    (set -x; ${profiler} \
-       mpirun -np ${nodes*tasks_per_node} \
+       /apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpirun -np ${nodes*tasks_per_node} \
            --bind-to none \
            "${target.get_install_binpath(case)}")
% endif
Proposed replacement for the mpirun line:
/apps/compilers/nvhpc/25.9/Linux_x86_64/comm_libs/mpi/bin/mpirun -np ${nodes*tasks_per_node} \
Steps of Reproduction ✅
1. Trigger an MPI run path by rendering toolchain/templates/hipergator.mako with a target
where mpi==True. The template enters the else branch shown at lines 50-55 and emits a
command containing the absolute mpirun path at line 52
("/apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpirun").

2. Submit the generated job or run the script on a compute node so the template-expressed
command executes. This is the normal execution path for distributed runs using this
template (the for-loop at lines 45-60 iterates targets and executes this branch when mpi
is enabled).

3. When the node shell attempts to execute the absolute path, the duplicated "25.9"
segment makes the path incorrect on nodes where the real NVHPC installation path does not
contain that duplicated segment. The shell prints "No such file or directory" and the MPI
launch fails immediately.

4. Observe the job failing to start distributed processes; the failure is reproducible by running any MPI-targeted job using this template (mpi==True) because the template emits the incorrect absolute path at toolchain/templates/hipergator.mako:52. A quick path-existence check is sketched after this list.
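
A hedged way to check step 3 without submitting a job is to test both candidate paths directly on a HiperGator node (both paths are copied from the diff and the suggestion above):

for p in \
  /apps/compilers/nvhpc/25.9/Linux_x86_64/25.9/comm_libs/mpi/bin/mpirun \
  /apps/compilers/nvhpc/25.9/Linux_x86_64/comm_libs/mpi/bin/mpirun
do
  # Report whether each candidate mpirun exists and is executable
  if [ -x "$p" ]; then echo "found:   $p"; else echo "missing: $p"; fi
done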
Prompt for AI Agent 🤖
This is a comment left during a code review.

**Path:** toolchain/templates/hipergator.mako
**Line:** 50:55
**Comment:**
Possible Bug: The absolute MPI launcher path contains a duplicated version segment ("25.9" appears twice), which very likely makes the path incorrect and the mpirun binary unavailable at runtime; fix the path to the correct single-version location so the launcher exists on the nodes.

Validate the correctness of the flagged issue. If correct, how can I resolve this? If you propose a fix, implement it and please keep it concise.
