From 8d46fd6fa25e4f3961f6a94a961c5c22d885890a Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Tue, 19 May 2026 14:24:48 +0200
Subject: [PATCH 01/11] fill exact solution on host

---
 include/GMGPolar/solver.h | 48 ++++++++++++++++++++++-----------------
 1 file changed, 27 insertions(+), 21 deletions(-)
diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index 927327da..6206af38 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -591,28 +591,34 @@ std::pair<double, double> GMGPolar<DomainGeometry, DensityProfileCoefficients>::
 
     assert(solution.size() == error.size());
     assert(std::ssize(solution) == grid.numberOfNodes());
-
-#pragma omp parallel num_threads(max_omp_threads_)
-    {
-#pragma omp for nowait
-        for (int i_r = 0; i_r < grid.numberSmootherCircles(); i_r++) {
-            double r = grid.radius(i_r);
-            for (int i_theta = 0; i_theta < grid.ntheta(); i_theta++) {
-                double theta = grid.theta(i_theta);
-                error[grid.index(i_r, i_theta)] =
-                    exact_solution.exact_solution(r, theta) - solution[grid.index(i_r, i_theta)];
-            }
-        }
-#pragma omp for nowait
-        for (int i_theta = 0; i_theta < grid.ntheta(); i_theta++) {
+    Vector<double> solution_d("solution_d", solution.size());
+    HostVector<double> exact_sol_h("exact_sol_h", solution.size());
+    Vector<double> exact_sol_d("exact_sol", solution.size());
+    Vector<double> error_d("error_d", solution.size());
+
+    Kokkos::parallel_for(
+        "fill exact sol on host",
+        Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
+        KOKKOS_LAMBDA(const int i_r, const int i_theta) {
+            double r                              = grid.radius(i_r);
+            double theta                          = grid.theta(i_theta);
+            exact_sol_h(grid.index(i_r, i_theta)) = exact_solution.exact_solution(r, theta);
+        });
+
+    Kokkos::deep_copy(exact_sol_d, exact_sol_h);
+    Kokkos::deep_copy(solution_d, solution);
+
+    Kokkos::parallel_for(
+        "compute error on device",
+        Kokkos::MDRangePolicy<Kokkos::DefaultExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
+        KOKKOS_LAMBDA(const int i_r, const int i_theta) {
+            double r     = grid.radius(i_r);
             double theta = grid.theta(i_theta);
-            for (int i_r = grid.numberSmootherCircles(); i_r < grid.nr(); i_r++) {
-                double r = grid.radius(i_r);
-                error[grid.index(i_r, i_theta)] =
-                    exact_solution.exact_solution(r, theta) - solution[grid.index(i_r, i_theta)];
-            }
-        }
-    }
+            error_d[grid.index(i_r, i_theta)] =
+                exact_sol_d(grid.index(i_r, i_theta)) - solution_d[grid.index(i_r, i_theta)];
+        });
+
+    Kokkos::deep_copy(error, error_d);
     HostConstVector<double> c_error = error;
     double weighted_euclidean_error = l2_norm(c_error) / std::sqrt(grid.numberOfNodes());
     double infinity_error           = infinity_norm(c_error);

From a215fe67e1ea69f299a58eed57cc948581c1545b Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Tue, 19 May 2026 17:03:35 +0200
Subject: [PATCH 02/11] compute and store exact solution once, pass it as a
 Vector

---
 include/GMGPolar/gmgpolar.h |  9 +++---
 include/GMGPolar/solver.h   | 56 +++++++++++++++++--------------------
 2 files changed, 31 insertions(+), 34 deletions(-)

diff --git a/include/GMGPolar/gmgpolar.h b/include/GMGPolar/gmgpolar.h
index 1f46bfe3..875ad3bc 100644
--- a/include/GMGPolar/gmgpolar.h
+++ b/include/GMGPolar/gmgpolar.h
@@ -134,7 +134,7 @@ class GMGPolar : public IGMGPolar
     std::vector<std::pair<double, double>> exact_errors_;
     std::pair<double, double> computeExactError(Level<DomainGeometry, DensityProfileCoefficients>& level,
                                                 HostConstVector<double> solution, HostVector<double> error,
-                                                const ExactSolution& exact_solution);
+                                                HostConstVector<double> exact_solution);
 
     /* --------------- */
     /* Setup Functions */
@@ -153,13 +153,14 @@ class GMGPolar : public IGMGPolar
     /* Solve Functions */
     void fullMultigridApproximation(MultigridCycleType FMG_cycle, int FMG_iterations);
     void solveMultigrid(double& initial_residual_norm, double& current_residual_norm,
-                        double& current_relative_residual_norm);
-    void solvePCG(double& initial_residual_norm, double& current_residual_norm, double& current_relative_residual_norm);
+                        double& current_relative_residual_norm, HostConstVector<double> exact_solution);
+    void solvePCG(double& initial_residual_norm, double& current_residual_norm, double& current_relative_residual_norm,
+                  HostConstVector<double> exact_solution);
     double residualNorm(const ResidualNormType& norm_type,
                         const Level<DomainGeometry, DensityProfileCoefficients>& level,
                         HostConstVector<double> residual) const;
     void evaluateExactError(Level<DomainGeometry, DensityProfileCoefficients>& level,
-                            const ExactSolution& exact_solution);
+                            HostConstVector<double> exact_solution);
     void updateResidualNorms(Level<DomainGeometry, DensityProfileCoefficients>& level, int iteration,
                              double& initial_residual_norm, double& current_residual_norm,
                              double& current_relative_residual_norm);
diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index 6206af38..d43a52cf 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -95,9 +95,20 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
     /* ---------------------------------------------- */
     LIKWID_STOP("Solver");
     auto start_check_exact_error = std::chrono::high_resolution_clock::now();
+    // fill exact solution on host to avoid repeat same comptuation
+    HostVector<double> exact_sol("exact_sol", level.solution().size());
+    const PolarGrid& grid = level.grid();
+    Kokkos::parallel_for(
+        "fill exact sol on host",
+        Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
+        KOKKOS_LAMBDA(const int i_r, const int i_theta) {
+            double r                            = grid.radius(i_r);
+            double theta                        = grid.theta(i_theta);
+            exact_sol(grid.index(i_r, i_theta)) = exact_solution_->exact_solution(r, theta);
+        });
 
     if (exact_solution_ != nullptr)
-        evaluateExactError(level, *exact_solution_);
+        evaluateExactError(level, exact_sol);
 
     auto end_check_exact_error = std::chrono::high_resolution_clock::now();
     t_check_exact_error_ += std::chrono::duration<double>(end_check_exact_error - start_check_exact_error).count();
@@ -121,7 +132,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
         if (!PCG_) {
             // Solve A*x = b directly using multigrid cycles (V/W/F-cycle)
             // until convergence or max_iterations_ is reached.
-            solveMultigrid(initial_residual_norm, current_residual_norm, current_relative_residual_norm);
+            solveMultigrid(initial_residual_norm, current_residual_norm, current_relative_residual_norm, exact_sol);
         }
         else {
             // Solve A*x = b using Preconditioned Conjugate Gradient (PCG),
@@ -129,7 +140,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
             // cycle approximates the action of A^{-1} at each PCG iteration).
             auto start_conjugate_gradient = std::chrono::high_resolution_clock::now();
 
-            solvePCG(initial_residual_norm, current_residual_norm, current_relative_residual_norm);
+            solvePCG(initial_residual_norm, current_residual_norm, current_relative_residual_norm, exact_sol);
 
             auto end_conjugate_gradient = std::chrono::high_resolution_clock::now();
             t_conjugate_gradient_ +=
@@ -170,7 +181,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
     if (paraview_) {
         writeToVTK("output_solution", level, level.solution());
         if (exact_solution_ != nullptr) {
-            computeExactError(level, level.solution(), level.residual(), *exact_solution_);
+            computeExactError(level, level.solution(), level.residual(), exact_sol);
             writeToVTK("output_error", level, level.residual());
         }
     }
@@ -215,7 +226,8 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::fullMultigridApproxim
 template <concepts::DomainGeometry DomainGeometry, concepts::DensityProfileCoefficients DensityProfileCoefficients>
 void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solveMultigrid(double& initial_residual_norm,
                                                                           double& current_residual_norm,
-                                                                          double& current_relative_residual_norm)
+                                                                          double& current_relative_residual_norm,
+                                                                          HostConstVector<double> exact_solution)
 {
     Level<DomainGeometry, DensityProfileCoefficients>& level = levels_[0];
 
@@ -245,7 +257,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solveMultigrid(double
         auto start_check_exact_error = std::chrono::high_resolution_clock::now();
 
         if (exact_solution_ != nullptr)
-            evaluateExactError(level, *exact_solution_);
+            evaluateExactError(level, exact_solution);
 
         auto end_check_exact_error = std::chrono::high_resolution_clock::now();
         t_check_exact_error_ += std::chrono::duration<double>(end_check_exact_error - start_check_exact_error).count();
@@ -288,7 +300,8 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solveMultigrid(double
 template <concepts::DomainGeometry DomainGeometry, concepts::DensityProfileCoefficients DensityProfileCoefficients>
 void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solvePCG(double& initial_residual_norm,
                                                                     double& current_residual_norm,
-                                                                    double& current_relative_residual_norm)
+                                                                    double& current_relative_residual_norm,
+                                                                    HostConstVector<double> exact_solution)
 {
     Level<DomainGeometry, DensityProfileCoefficients>& level = levels_[0];
 
@@ -355,7 +368,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solvePCG(double& init
         auto start_check_exact_error = std::chrono::high_resolution_clock::now();
 
         if (exact_solution_ != nullptr)
-            exact_errors_.push_back(computeExactError(level, pcg_solution_, level.residual(), *exact_solution_));
+            exact_errors_.push_back(computeExactError(level, pcg_solution_, level.residual(), exact_solution));
 
         auto end_check_exact_error = std::chrono::high_resolution_clock::now();
         t_check_exact_error_ += std::chrono::duration<double>(end_check_exact_error - start_check_exact_error).count();
@@ -574,7 +587,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::initRhsHierarchy(Host
 
 template <concepts::DomainGeometry DomainGeometry, concepts::DensityProfileCoefficients DensityProfileCoefficients>
 void GMGPolar<DomainGeometry, DensityProfileCoefficients>::evaluateExactError(
-    Level<DomainGeometry, DensityProfileCoefficients>& level, const ExactSolution& exact_solution)
+    Level<DomainGeometry, DensityProfileCoefficients>& level, HostConstVector<double> exact_solution)
 {
     // Compute the weighted L2 norm and infinity norm of the error between the numerical and exact solution.
     // The results are stored as a pair: (weighted L2 error, infinity error).
@@ -584,41 +597,24 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::evaluateExactError(
 template <concepts::DomainGeometry DomainGeometry, concepts::DensityProfileCoefficients DensityProfileCoefficients>
 std::pair<double, double> GMGPolar<DomainGeometry, DensityProfileCoefficients>::computeExactError(
     Level<DomainGeometry, DensityProfileCoefficients>& level, HostConstVector<double> solution,
-    HostVector<double> error, const ExactSolution& exact_solution)
+    HostVector<double> error, HostConstVector<double> exact_solution)
 {
     const PolarGrid& grid                                                    = level.grid();
     const LevelCache<DomainGeometry, DensityProfileCoefficients>& levelCache = level.levelCache();
 
     assert(solution.size() == error.size());
     assert(std::ssize(solution) == grid.numberOfNodes());
-    Vector<double> solution_d("solution_d", solution.size());
-    HostVector<double> exact_sol_h("exact_sol_h", solution.size());
-    Vector<double> exact_sol_d("exact_sol", solution.size());
-    Vector<double> error_d("error_d", solution.size());
-
-    Kokkos::parallel_for(
-        "fill exact sol on host",
-        Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
-        KOKKOS_LAMBDA(const int i_r, const int i_theta) {
-            double r                              = grid.radius(i_r);
-            double theta                          = grid.theta(i_theta);
-            exact_sol_h(grid.index(i_r, i_theta)) = exact_solution.exact_solution(r, theta);
-        });
-
-    Kokkos::deep_copy(exact_sol_d, exact_sol_h);
-    Kokkos::deep_copy(solution_d, solution);
 
     Kokkos::parallel_for(
         "compute error on device",
-        Kokkos::MDRangePolicy<Kokkos::DefaultExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
+        Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
         KOKKOS_LAMBDA(const int i_r, const int i_theta) {
             double r     = grid.radius(i_r);
             double theta = grid.theta(i_theta);
-            error_d[grid.index(i_r, i_theta)] =
-                exact_sol_d(grid.index(i_r, i_theta)) - solution_d[grid.index(i_r, i_theta)];
+            error[grid.index(i_r, i_theta)] =
+                exact_solution(grid.index(i_r, i_theta)) - solution[grid.index(i_r, i_theta)];
         });
 
-    Kokkos::deep_copy(error, error_d);
     HostConstVector<double> c_error = error;
     double weighted_euclidean_error = l2_norm(c_error) / std::sqrt(grid.numberOfNodes());
     double infinity_error           = infinity_norm(c_error);

From e7baa1ef48ba14f532a42b9777c49f984ffbc127 Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Tue, 19 May 2026 17:08:06 +0200
Subject: [PATCH 03/11] fix typo

---
 include/GMGPolar/solver.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index d43a52cf..11f37922 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -95,7 +95,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
     /* ---------------------------------------------- */
     LIKWID_STOP("Solver");
     auto start_check_exact_error = std::chrono::high_resolution_clock::now();
-    // fill exact solution on host to avoid repeat same comptuation
+    // fill exact solution on host to avoid repeat same computation
     HostVector<double> exact_sol("exact_sol", level.solution().size());
     const PolarGrid& grid = level.grid();
     Kokkos::parallel_for(

From 65a99dc75115850c059ccb96b83a7e19deaf5143 Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Wed, 20 May 2026 10:34:19 +0200
Subject: [PATCH 04/11] use KOKKOS_CLASS_LAMBDA for host parallel loop

---
 include/GMGPolar/solver.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index 53bd7815..7ce407ee 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -608,7 +608,7 @@ std::pair<double, double> GMGPolar<DomainGeometry, DensityProfileCoefficients>::
     Kokkos::parallel_for(
         "compute error on host",
         Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
-        KOKKOS_LAMBDA(const int i_r, const int i_theta) {
+        KOKKOS_CLASS_LAMBDA(const int i_r, const int i_theta) {
             double r     = grid.radius(i_r);
             double theta = grid.theta(i_theta);
             error[grid.index(i_r, i_theta)] =

From 678e9158a3986b44732dadda6288db7f5fa3166f Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Wed, 20 May 2026 10:49:14 +0200
Subject: [PATCH 05/11] pass by reference in cpu loops

---
 include/GMGPolar/solver.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index 7ce407ee..95b5e050 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -101,7 +101,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
     Kokkos::parallel_for(
         "fill exact sol on host",
         Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
-        KOKKOS_LAMBDA(const int i_r, const int i_theta) {
+        [&](const int i_r, const int i_theta) {
             double r                            = grid.radius(i_r);
             double theta                        = grid.theta(i_theta);
             exact_sol(grid.index(i_r, i_theta)) = exact_solution_->exact_solution(r, theta);
@@ -608,7 +608,7 @@ std::pair<double, double> GMGPolar<DomainGeometry, DensityProfileCoefficients>::
     Kokkos::parallel_for(
         "compute error on host",
         Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
-        KOKKOS_CLASS_LAMBDA(const int i_r, const int i_theta) {
+        [&](const int i_r, const int i_theta) {
             double r     = grid.radius(i_r);
             double theta = grid.theta(i_theta);
             error[grid.index(i_r, i_theta)] =

From 494289e9890103cadde4588425ccdac8c7c69e71 Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Thu, 21 May 2026 09:48:23 +0200
Subject: [PATCH 06/11] iterate over grid index, create if condition and
 allocate exact_sol outside of it

---
 include/GMGPolar/solver.h | 42 +++++++++++++++++++--------------------
 1 file changed, 20 insertions(+), 22 deletions(-)

diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index 14ea4b03..f86af352 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -95,21 +95,23 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
     /* ---------------------------------------------- */
     LIKWID_STOP("Solver");
     auto start_check_exact_error = std::chrono::high_resolution_clock::now();
-    // fill exact solution on host to avoid repeat same computation
     HostVector<double> exact_sol("exact_sol", level.solution().size());
-    const PolarGrid& grid = level.grid();
-    Kokkos::parallel_for(
-        "fill exact sol on host",
-        Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
-        [&](const int i_r, const int i_theta) {
-            double r                            = grid.radius(i_r);
-            double theta                        = grid.theta(i_theta);
-            exact_sol(grid.index(i_r, i_theta)) = exact_solution_->exact_solution(r, theta);
-        });
-
-    if (exact_solution_ != nullptr)
-        evaluateExactError(level, exact_sol);
+    if (exact_solution_ != nullptr) {
+        // fill exact solution on host to avoid repeat same computation
+        const PolarGrid& grid = level.grid();
+
+        Kokkos::parallel_for("fill exact sol on host",
+                             Kokkos::RangePolicy<Kokkos::DefaultHostExecutionSpace>({0, exact_sol.size()}),
+                             [&](const int grid_idx) {
+                                 int i_r, i_theta;
+                                 grid.multiIndex(grid_idx, i_r, i_theta);
+                                 double r            = grid.radius(i_r);
+                                 double theta        = grid.theta(i_theta);
+                                 exact_sol(grid_idx) = exact_solution_->exact_solution(r, theta);
+                             });
 
+        evaluateExactError(level, exact_sol);
+    }
     auto end_check_exact_error = std::chrono::high_resolution_clock::now();
     t_check_exact_error_ += std::chrono::duration<double>(end_check_exact_error - start_check_exact_error).count();
     LIKWID_START("Solver");
@@ -604,15 +606,11 @@ std::pair<double, double> GMGPolar<DomainGeometry, DensityProfileCoefficients>::
     assert(solution.size() == error.size());
     assert(std::ssize(solution) == grid.numberOfNodes());
 
-    Kokkos::parallel_for(
-        "compute error on host",
-        Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>({0, 0}, {grid.nr(), grid.ntheta()}),
-        [&](const int i_r, const int i_theta) {
-            double r     = grid.radius(i_r);
-            double theta = grid.theta(i_theta);
-            error[grid.index(i_r, i_theta)] =
-                exact_solution(grid.index(i_r, i_theta)) - solution[grid.index(i_r, i_theta)];
-        });
+    Kokkos::parallel_for("compute error on host",
+                         Kokkos::RangePolicy<Kokkos::DefaultHostExecutionSpace>({0, exact_solution.size()}),
+                         [&](const int grid_idx) {
+                             error[grid_idx] = exact_solution(grid_idx) - solution[grid_idx];
+                         });
 
     HostConstVector<double> c_error = error;
     double weighted_euclidean_error = l2_norm(c_error) / std::sqrt(grid.numberOfNodes());

From bd98e908a106a8f594c12863e79ee69e2c0cc95f Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Thu, 21 May 2026 10:06:30 +0200
Subject: [PATCH 07/11] harmonize exact_solution condition with the rest of the
 code

---
 include/GMGPolar/solver.h | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index f86af352..17f988f0 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -96,7 +96,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
     LIKWID_STOP("Solver");
     auto start_check_exact_error = std::chrono::high_resolution_clock::now();
     HostVector<double> exact_sol("exact_sol", level.solution().size());
-    if (exact_solution_ != nullptr) {
+    if (exact_solution_) {
         // fill exact solution on host to avoid repeat same computation
         const PolarGrid& grid = level.grid();
 
@@ -182,7 +182,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
 
     if (paraview_) {
         writeToVTK("output_solution", level, level.solution());
-        if (exact_solution_ != nullptr) {
+        if (exact_solution_) {
             computeExactError(level, level.solution(), level.residual(), exact_sol);
             writeToVTK("output_error", level, level.residual());
         }
@@ -258,7 +258,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solveMultigrid(double
         LIKWID_STOP("Solver");
         auto start_check_exact_error = std::chrono::high_resolution_clock::now();
 
-        if (exact_solution_ != nullptr)
+        if (exact_solution_)
             evaluateExactError(level, exact_solution);
 
         auto end_check_exact_error = std::chrono::high_resolution_clock::now();
@@ -369,7 +369,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solvePCG(double& init
         LIKWID_STOP("Solver");
         auto start_check_exact_error = std::chrono::high_resolution_clock::now();
 
-        if (exact_solution_ != nullptr)
+        if (exact_solution_)
             exact_errors_.push_back(computeExactError(level, pcg_solution_, level.residual(), exact_solution));
 
         auto end_check_exact_error = std::chrono::high_resolution_clock::now();

From cb335678c92566f8051792d1b09b60f1cc24eb4e Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Thu, 21 May 2026 10:37:05 +0200
Subject: [PATCH 08/11] return to using a multi-dimensional loop for exact
 solution fill

---
 include/GMGPolar/solver.h | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index 17f988f0..b6554670 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -101,12 +101,12 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
         const PolarGrid& grid = level.grid();
 
         Kokkos::parallel_for("fill exact sol on host",
-                             Kokkos::RangePolicy<Kokkos::DefaultHostExecutionSpace>({0, exact_sol.size()}),
-                             [&](const int grid_idx) {
-                                 int i_r, i_theta;
-                                 grid.multiIndex(grid_idx, i_r, i_theta);
+                             Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>(
+                                 {0, 0}, {grid.nr(), grid.ntheta()}),
+                             [&](const int i_r, const int i_theta) {
                                  double r            = grid.radius(i_r);
                                  double theta        = grid.theta(i_theta);
+                                 const int grid_idx  = grid.index(i_r, i_theta);
                                  exact_sol(grid_idx) = exact_solution_->exact_solution(r, theta);
                              });
 

From af6c2cdd1279515fafa28d8b1c6a221f17bdfdf1 Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Thu, 21 May 2026 12:23:45 +0200
Subject: [PATCH 09/11] split filling into 2 loops, use subtract function

---
 include/GMGPolar/solver.h | 21 ++++++++++++++-------
 1 file changed, 14 insertions(+), 7 deletions(-)

diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index b6554670..10b1b005 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -100,15 +100,24 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
         // fill exact solution on host to avoid repeat same computation
         const PolarGrid& grid = level.grid();
 
-        Kokkos::parallel_for("fill exact sol on host",
+        Kokkos::parallel_for("fill exact sol outter loop on r",
                              Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>(
-                                 {0, 0}, {grid.nr(), grid.ntheta()}),
+                                 {0, 0}, {grid.numberSmootherCircles(), grid.ntheta()}),
                              [&](const int i_r, const int i_theta) {
                                  double r            = grid.radius(i_r);
                                  double theta        = grid.theta(i_theta);
                                  const int grid_idx  = grid.index(i_r, i_theta);
                                  exact_sol(grid_idx) = exact_solution_->exact_solution(r, theta);
                              });
+        Kokkos::parallel_for("fill exact sol outter loop on theta",
+                             Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>(
+                                 {0, grid.numberSmootherCircles()}, {grid.ntheta(), grid.nr()}),
+                             [&](const int i_theta, const int i_r) {
+                                 double r            = grid.radius(i_r);
+                                 double theta        = grid.theta(i_theta);
+                                 const int grid_idx  = grid.index(i_r, i_theta);
+                                 exact_sol(grid_idx) = exact_solution_->exact_solution(r, theta);
+                             });
 
         evaluateExactError(level, exact_sol);
     }
@@ -606,11 +615,9 @@ std::pair<double, double> GMGPolar<DomainGeometry, DensityProfileCoefficients>::
     assert(solution.size() == error.size());
     assert(std::ssize(solution) == grid.numberOfNodes());
 
-    Kokkos::parallel_for("compute error on host",
-                         Kokkos::RangePolicy<Kokkos::DefaultHostExecutionSpace>({0, exact_solution.size()}),
-                         [&](const int grid_idx) {
-                             error[grid_idx] = exact_solution(grid_idx) - solution[grid_idx];
-                         });
+    Kokkos::deep_copy(error, solution);
+    // Compute the error as the difference between exact and numerical solution
+    subtract(error, exact_solution);
 
     HostConstVector<double> c_error = error;
     double weighted_euclidean_error = l2_norm(c_error) / std::sqrt(grid.numberOfNodes());

From 457cff1d230dff5b857685ed8c95d34f54e85dc7 Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Thu, 21 May 2026 13:05:37 +0200
Subject: [PATCH 10/11] fix outer word typo

---
 include/GMGPolar/solver.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index 10b1b005..6b1586ee 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -100,7 +100,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
         // fill exact solution on host to avoid repeat same computation
         const PolarGrid& grid = level.grid();
 
-        Kokkos::parallel_for("fill exact sol outter loop on r",
+        Kokkos::parallel_for("fill exact sol outer loop on r",
                              Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>(
                                  {0, 0}, {grid.numberSmootherCircles(), grid.ntheta()}),
                              [&](const int i_r, const int i_theta) {
@@ -109,7 +109,7 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
                                  const int grid_idx  = grid.index(i_r, i_theta);
                                  exact_sol(grid_idx) = exact_solution_->exact_solution(r, theta);
                              });
-        Kokkos::parallel_for("fill exact sol outter loop on theta",
+        Kokkos::parallel_for("fill exact sol outer loop on theta",
                              Kokkos::MDRangePolicy<Kokkos::DefaultHostExecutionSpace, Kokkos::Rank<2>>(
                                  {0, grid.numberSmootherCircles()}, {grid.ntheta(), grid.nr()}),
                              [&](const int i_theta, const int i_r) {

From 26da51e6c3014bf88036a9bbdd71300bbce04c24 Mon Sep 17 00:00:00 2001
From: KARA Abdelhadi 265943 <abdelhadi.kara@cea.fr>
Date: Thu, 21 May 2026 16:03:48 +0200
Subject: [PATCH 11/11] allocate exact solution only if needed

---
 include/GMGPolar/solver.h | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/include/GMGPolar/solver.h b/include/GMGPolar/solver.h
index 6b1586ee..efb1aac3 100644
--- a/include/GMGPolar/solver.h
+++ b/include/GMGPolar/solver.h
@@ -95,8 +95,9 @@ void GMGPolar<DomainGeometry, DensityProfileCoefficients>::solve(const BoundaryC
     /* ---------------------------------------------- */
     LIKWID_STOP("Solver");
     auto start_check_exact_error = std::chrono::high_resolution_clock::now();
-    HostVector<double> exact_sol("exact_sol", level.solution().size());
+    HostAllocatableVector<double> exact_sol;
     if (exact_solution_) {
+        exact_sol = HostVector<double>("exact_sol", level.solution().size());
         // fill exact solution on host to avoid repeat same computation
         const PolarGrid& grid = level.grid();