Merge branch 'gitlab-ci' into mock_development

WeiqunZhang · WeiqunZhang · commit 555648232adb · 2025-11-15T10:46:28.000-08:00
diff --git a/.gitlab/hpsf-gitlab-ci.yml b/.gitlab/hpsf-gitlab-ci.yml
@@ -0,0 +1,84 @@
+Nvidia-H100-single-precision:
+  stage: test
+  tags: [nvidia-h100]
+  image: nvcr.io/nvidia/cuda:12.8.0-devel-ubuntu24.04
+  script:
+    - apt-get update && apt-get install -y cmake git python3 libopenmpi-dev openmpi-bin
+    - |
+      cmake -S . -B build                              \
+          -DCMAKE_VERBOSE_MAKEFILE=ON                  \
+          -DAMReX_PRECISION=SINGLE                     \
+          -DAMReX_PARTICLES_PRECISION=SINGLE           \
+          -DAMReX_SPACEDIM="1;2;3"                     \
+          -DAMReX_FFT=ON                               \
+          -DAMReX_EB=ON                                \
+          -DAMReX_ENABLE_TESTS=ON                      \
+          -DAMReX_FORTRAN=OFF                          \
+          -DAMReX_GPU_BACKEND=CUDA                     \
+          -DCMAKE_C_COMPILER=$(which gcc)              \
+          -DCMAKE_CXX_COMPILER=$(which g++)            \
+          -DCMAKE_CUDA_HOST_COMPILER=$(which g++)      \
+          -DAMReX_CUDA_ARCH="9.0"                      \
+          -DAMReX_CUDA_ERROR_CROSS_EXECUTION_SPACE_CALL=ON \
+          -DAMReX_CUDA_ERROR_CAPTURE_THIS=ON
+    - cmake --build build -j 16
+    - export OMPI_ALLOW_RUN_AS_ROOT=1
+    - export OMPI_ALLOW_RUN_AS_ROOT_CONFIRM=1
+    - export AMREX_THE_ARENA_INIT_SIZE=1e9
+    - ctest -j 2 --test-dir build --output-on-failure
+
+AMD-MI300A:
+  stage: test
+  tags: [amd-mi300]
+  image: rocm/dev-ubuntu-24.04:6.4.3-complete
+  script:
+    - apt-get update && apt-get install -y cmake git libopenmpi-dev openmpi-bin
+    - export ROCM_PATH=/opt/rocm-6.4.3
+    - export PATH=$ROCM_PATH/bin:$ROCM_PATH/llvm/bin:$PATH
+    - export LD_LIBRARY_PATH=$ROCM_PATH/lib:$ROCM_PATH/lib64:$LD_LIBRARY_PATH
+    - export HIP_PATH=$ROCM_PATH
+    - export HIP_CLANG_PATH=$ROCM_PATH/llvm/bin
+    - export CMAKE_PREFIX_PATH=$ROCM_PATH:$CMAKE_PREFIX_PATH
+    - |
+      cmake -S . -B build                              \
+          -DCMAKE_VERBOSE_MAKEFILE=ON                  \
+          -DAMReX_SPACEDIM="1;2;3"                     \
+          -DAMReX_FFT=ON                               \
+          -DAMReX_EB=ON                                \
+          -DAMReX_ENABLE_TESTS=ON                      \
+          -DAMReX_FORTRAN=OFF                          \
+          -DAMReX_GPU_BACKEND=HIP                      \
+          -DAMReX_AMD_ARCH=gfx942                      \
+          -DCMAKE_C_COMPILER=$(which clang)            \
+          -DCMAKE_CXX_COMPILER=$(which clang++)        \
+          -DCMAKE_CXX_STANDARD=17
+    - cmake --build build -j 16
+    - export OMPI_ALLOW_RUN_AS_ROOT=1
+    - export OMPI_ALLOW_RUN_AS_ROOT_CONFIRM=1
+    - export AMREX_THE_ARENA_INIT_SIZE=1e9
+    - ctest -j 2 --test-dir build --output-on-failure
+
+Intel-PVC:
+  stage: test
+  tags: [intel-data-center-max-1100]
+  image: intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04
+  script:
+    - apt-get update && apt-get install -y git
+    - sycl-ls
+    - export ONEAPI_DEVICE_SELECTOR=level_zero:gpu
+    - |
+      cmake -S . -B build                              \
+          -DCMAKE_VERBOSE_MAKEFILE=ON                  \
+          -DAMReX_MPI=OFF                              \
+          -DAMReX_SPACEDIM="1;2;3"                     \
+          -DAMReX_FFT=ON                               \
+          -DAMReX_EB=ON                                \
+          -DAMReX_ENABLE_TESTS=ON                      \
+          -DAMReX_FORTRAN=OFF                          \
+          -DAMReX_GPU_BACKEND=SYCL                     \
+          -DCMAKE_C_COMPILER=$(which icx)              \
+          -DCMAKE_CXX_COMPILER=$(which icpx)           \
+          -DAMReX_PARALLEL_LINK_JOBS=8
+    - cmake --build build -j 16
+    - export AMREX_THE_ARENA_INIT_SIZE=1e9
+    - ctest -j 4 --test-dir build --output-on-failure
diff --git a/Docs/sphinx_documentation/source/GPU.rst b/Docs/sphinx_documentation/source/GPU.rst
@@ -560,8 +560,16 @@ to :cpp:`The_Arena()` to reduce memory fragmentation.
 In :cpp:`amrex::Initialize`, a large amount of GPU device memory is
 allocated and is kept in :cpp:`The_Arena()`.  The default is 3/4 of the
 total device memory, and it can be changed with a :cpp:`ParmParse`
-parameter, ``amrex.the_arena_init_size``, in the unit of bytes.  The default
-initial size for other arenas is 8388608 (i.e., 8 MB).  For
+parameter, ``amrex.the_arena_init_size``, in units of bytes. The default
+can also be changed with the environment variable
+``AMREX_THE_ARENA_INIT_SIZE=X``, where ``X`` is the number of bytes. When
+both the :cpp:`ParmParse` parameter and the environment variable are
+present, the former overrides the latter. In both cases, the number
+string may contain optional single quotes ``'`` as digit separators (e.g.,
+``10'000'000'000``). It may also use floating-point notation (e.g., ``2.5e10``),
+as long as the conversion to an integer does not lose precision.
+
+The default initial size for other arenas is 8388608 (i.e., 8 MB).  For
 :cpp:`The_Managed_Arena()` and :cpp:`The_Device_Arena()`, it can be changed
 with ``amrex.the_managed_arena_init_size`` and
 ``amrex.the_device_arena_init_size``, respectively, if they are not an alias
diff --git a/Src/Base/AMReX_Arena.cpp b/Src/Base/AMReX_Arena.cpp
@@ -6,6 +6,7 @@
 
 #include <AMReX.H>
 #include <AMReX_BLProfiler.H>
+#include <AMReX_IParser.H>
 #include <AMReX_Print.H>
 #include <AMReX_ParallelDescriptor.H>
 #include <AMReX_ParmParse.H>
@@ -362,6 +363,13 @@ Arena::Initialize (bool minimal)
     the_pinned_arena_release_threshold = Gpu::Device::totalGlobalMem() / Gpu::Device::numDevicePartners() / 2L;
 #endif
 
+    // Override the default initial size from the environment; the ParmParse query below takes precedence
+    if (char const* init_size_p = std::getenv("AMREX_THE_ARENA_INIT_SIZE")) {
+        IParser iparser(init_size_p);
+        auto exe = iparser.compileHost<0>();
+        the_arena_init_size = exe();
+    }
+
     ParmParse pp("amrex");
     pp.queryAdd(        "the_arena_init_size",         the_arena_init_size);
     pp.queryAdd( "the_device_arena_init_size",  the_device_arena_init_size);
diff --git a/Tests/Algebra/GMRES/main.cpp b/Tests/Algebra/GMRES/main.cpp
@@ -113,7 +113,11 @@ int main (int argc, char* argv[])
         amrex::Axpy(xvec, Real(-1.0), exact);
         auto error = xvec.norminf();
         amrex::Print() << " Max norm error: " << error << "\n";
+#ifdef AMREX_USE_FLOAT
+        AMREX_ALWAYS_ASSERT(error < eps);
+#else
         AMREX_ALWAYS_ASSERT(error*10 < eps);
+#endif
     }
     amrex::Finalize();
 }
diff --git a/Tests/CommType/main.cpp b/Tests/CommType/main.cpp
@@ -12,9 +12,9 @@ int main(int argc, char* argv[])
     int ret_code = EXIT_SUCCESS;
 
     {
-        int ncells = 128;
+        int ncells = 64;
         BoxArray ba(Box(IntVect(0), IntVect(ncells-1)));
-        ba.maxSize(32);
+        ba.maxSize(16);
         ba.convert(IntVect(1));
         DistributionMapping dm(ba);
 
diff --git a/Tests/FFT/Batch/main.cpp b/Tests/FFT/Batch/main.cpp
@@ -106,7 +106,7 @@ int main (int argc, char* argv[])
             auto error = mf2.norminf(0, batch_size, IntVect(0));
             amrex::Print() << "  Expected to be close to zero: " << error << "\n";
 #ifdef AMREX_USE_FLOAT
-            auto eps = 1.e-6f;
+            auto eps = 3.e-6F;
 #else
             auto eps = 1.e-13;
 #endif
@@ -133,7 +133,7 @@ int main (int argc, char* argv[])
             auto error = errmf.norminf(0, batch_size, IntVect(0));
             amrex::Print() << "  Expected to be close to zero: " << error << "\n";
 #ifdef AMREX_USE_FLOAT
-            auto eps = 0.5e-6f;
+            auto eps = 3.e-6F;
 #else
             auto eps = 1.e-15;
 #endif
@@ -156,7 +156,7 @@ int main (int argc, char* argv[])
             auto error = mf2.norminf(0, batch_size, IntVect(0));
             amrex::Print() << "  Expected to be close to zero: " << error << "\n";
 #ifdef AMREX_USE_FLOAT
-            auto eps = 1.e-6f;
+            auto eps = 3.e-6F;
 #else
             auto eps = 1.e-13;
 #endif
diff --git a/Tests/FFT/RawPtr/main.cpp b/Tests/FFT/RawPtr/main.cpp
@@ -69,7 +69,7 @@ int main (int argc, char* argv[])
                      });
         amrex::Print() << "  Expected to be close to zero: " << error << "\n";
 #ifdef AMREX_USE_FLOAT
-        auto eps = 1.e-6f;
+        auto eps = 3.e-6F;
 #else
         auto eps = 1.e-13;
 #endif
@@ -124,7 +124,7 @@ int main (int argc, char* argv[])
                      });
         amrex::Print() << "  Expected to be close to zero: " << error << "\n";
 #ifdef AMREX_USE_FLOAT
-        auto eps = 1.e-6f;
+        auto eps = 3.e-6F;
 #else
         auto eps = 1.e-13;
 #endif
diff --git a/Tests/LinearSolvers/NodalPoisson/MyTest.cpp b/Tests/LinearSolvers/NodalPoisson/MyTest.cpp
@@ -166,6 +166,9 @@ MyTest::readParameters ()
     pp.query("max_iter", max_iter);
     pp.query("max_fmg_iter", max_fmg_iter);
     pp.query("reltol", reltol);
+#ifdef AMREX_USE_FLOAT
+        reltol = std::max(reltol, 1.e-5F);
+#endif
 
     pp.query("gpu_regtest", gpu_regtest);
 
diff --git a/Tests/LinearSolvers/Nodal_Projection_EB/main.cpp b/Tests/LinearSolvers/Nodal_Projection_EB/main.cpp
@@ -249,7 +249,11 @@ int main (int argc, char* argv[])
         //    nodal_solver.setBottomSolver(MLMG::BottomSolver::hypre);
 
         // Define the relative tolerance
+#ifdef AMREX_USE_FLOAT
+        Real reltol = 2.e-4;
+#else
         Real reltol = 1.e-8;
+#endif
 
         // Define the absolute tolerance; note that this argument is optional
         Real abstol = 1.e-15;
diff --git a/Tests/Parser/main.cpp b/Tests/Parser/main.cpp
diff --git a/Tests/Particles/NeighborParticles/CMakeLists.txt b/Tests/Particles/NeighborParticles/CMakeLists.txt

Original file line number	Diff line number	Diff line change
`@@ -113,7 +113,11 @@ int main (int argc, char* argv[])`
`113`	`113`	`amrex::Axpy(xvec, Real(-1.0), exact);`
`114`	`114`	`auto error = xvec.norminf();`
`115`	`115`	`amrex::Print() << " Max norm error: " << error << "\n";`
	`116`	`+#ifdef AMREX_USE_FLOAT`
	`117`	`+ AMREX_ALWAYS_ASSERT(error < eps);`
	`118`	`+#else`
`116`	`119`	`AMREX_ALWAYS_ASSERT(error*10 < eps);`
	`120`	`+#endif`
`117`	`121`	`}`
`118`	`122`	`amrex::Finalize();`
`119`	`123`	`}`