From 49d00efbc549bb081cf9ed2204674b9382c661cb Mon Sep 17 00:00:00 2001 From: Luke Roberts Date: Wed, 4 Oct 2023 18:04:28 -0600 Subject: [PATCH] changes to make things work on gpu --- example/poisson_gmg/poisson_equation.hpp | 1 - example/poisson_gmg/poisson_package.hpp | 199 ----------------------- src/solvers/mg_solver.hpp | 6 +- 3 files changed, 3 insertions(+), 203 deletions(-) diff --git a/example/poisson_gmg/poisson_equation.hpp b/example/poisson_gmg/poisson_equation.hpp index 62787a6f1889..ddfa80ba8913 100644 --- a/example/poisson_gmg/poisson_equation.hpp +++ b/example/poisson_gmg/poisson_equation.hpp @@ -101,7 +101,6 @@ class PoissonEquation { return TaskStatus::complete; } - private: template static parthenon::TaskStatus CalculateFluxes(std::shared_ptr> &md) { diff --git a/example/poisson_gmg/poisson_package.hpp b/example/poisson_gmg/poisson_package.hpp index dac446769e0b..a3b9a37dbf56 100644 --- a/example/poisson_gmg/poisson_package.hpp +++ b/example/poisson_gmg/poisson_package.hpp @@ -88,205 +88,6 @@ TaskStatus PrintChosenValues(std::shared_ptr> &md, return TaskStatus::complete; } -class flux_poisson { - public: - // std::vector RequiredMetadata - - template - parthenon::TaskID Ax(TL_t &tl, parthenon::TaskID depends_on, - std::shared_ptr> &md, bool only_interior, - bool do_flux_cor = false) { - auto flux_res = tl.AddTask(depends_on, CalculateFluxes, md); - if (do_flux_cor && !only_md_level) { - auto start_flxcor = - tl.AddTask(flux_res, parthenon::StartReceiveFluxCorrections, md); - auto send_flxcor = tl.AddTask(flux_res, parthenon::LoadAndSendFluxCorrections, md); - auto recv_flxcor = tl.AddTask(send_flxcor, parthenon::ReceiveFluxCorrections, md); - flux_res = tl.AddTask(recv_flxcor, parthenon::SetFluxCorrections, md); - } - return tl.AddTask(flux_res, FluxMultiplyMatrix, md, - only_interior); - } - - template - parthenon::TaskStatus SetDiagonal(std::shared_ptr> &md) { - using namespace parthenon; - const int ndim = md->GetMeshPointer()->ndim; - using TE = parthenon::TopologicalElement; - TE te = TE::CC; - IndexRange ib = md->GetBoundsI(IndexDomain::interior, te); - IndexRange jb = md->GetBoundsJ(IndexDomain::interior, te); - IndexRange kb = md->GetBoundsK(IndexDomain::interior, te); - - auto pkg = md->GetMeshPointer()->packages.Get("poisson_package"); - const auto alpha = pkg->Param("diagonal_alpha"); - - int nblocks = md->NumBlocks(); - std::vector include_block(nblocks, true); - - if (only_md_level) { - for (int b = 0; b < nblocks; ++b) - include_block[b] = (md->grid.logical_level == - md->GetBlockData(b)->GetBlockPointer()->loc.level()); - } - - auto desc = parthenon::MakePackDescriptor(md.get()); - auto pack = desc.GetPack(md.get(), include_block); - parthenon::par_for( - DEFAULT_LOOP_PATTERN, "StoreDiagonal", DevExecSpace(), 0, pack.GetNBlocks() - 1, - kb.s, kb.e, jb.s, jb.e, ib.s, ib.e, - KOKKOS_LAMBDA(const int b, const int k, const int j, const int i) { - const auto &coords = pack.GetCoordinates(b); - // Build the unigrid diagonal of the matrix - Real dx1 = coords.template Dxc(k, j, i); - Real diag_elem = - -(pack(b, TE::F1, D(), k, j, i) + pack(b, TE::F1, D(), k, j, i + 1)) / - (dx1 * dx1) - - alpha; - if (ndim > 1) { - Real dx2 = coords.template Dxc(k, j, i); - diag_elem -= - (pack(b, TE::F2, D(), k, j, i) + pack(b, TE::F2, D(), k, j + 1, i)) / - (dx2 * dx2); - } - if (ndim > 2) { - Real dx3 = coords.template Dxc(k, j, i); - diag_elem -= - (pack(b, TE::F3, D(), k, j, i) + pack(b, TE::F3, D(), k + 1, j, i)) / - (dx3 * dx3); - } - pack(b, te, diag_t(), k, j, i) = diag_elem; - }); - return TaskStatus::complete; - } - - private: - template - static parthenon::TaskStatus - CalculateFluxes(std::shared_ptr> &md) { - using namespace parthenon; - const int ndim = md->GetMeshPointer()->ndim; - using TE = parthenon::TopologicalElement; - TE te = TE::CC; - IndexRange ib = md->GetBoundsI(IndexDomain::interior, te); - IndexRange jb = md->GetBoundsJ(IndexDomain::interior, te); - IndexRange kb = md->GetBoundsK(IndexDomain::interior, te); - - using TE = parthenon::TopologicalElement; - - int nblocks = md->NumBlocks(); - std::vector include_block(nblocks, true); - - if (only_md_level) { - for (int b = 0; b < nblocks; ++b) - include_block[b] = (md->grid.logical_level == - md->GetBlockData(b)->GetBlockPointer()->loc.level()); - } - - auto desc = - parthenon::MakePackDescriptor(md.get(), {}, {PDOpt::WithFluxes}); - auto pack = desc.GetPack(md.get(), include_block); - parthenon::par_for( - DEFAULT_LOOP_PATTERN, "CaclulateFluxes", DevExecSpace(), 0, pack.GetNBlocks() - 1, - kb.s, kb.e, jb.s, jb.e, ib.s, ib.e, - KOKKOS_LAMBDA(const int b, const int k, const int j, const int i) { - const auto &coords = pack.GetCoordinates(b); - Real dx1 = coords.template Dxc(k, j, i); - pack.flux(b, X1DIR, var_t(), k, j, i) = - pack(b, TE::F1, D(), k, j, i) / dx1 * - (pack(b, te, var_t(), k, j, i - 1) - pack(b, te, var_t(), k, j, i)); - if (i == ib.e) - pack.flux(b, X1DIR, var_t(), k, j, i + 1) = - pack(b, TE::F1, D(), k, j, i + 1) / dx1 * - (pack(b, te, var_t(), k, j, i) - pack(b, te, var_t(), k, j, i + 1)); - - if (ndim > 1) { - Real dx2 = coords.template Dxc(k, j, i); - pack.flux(b, X2DIR, var_t(), k, j, i) = - pack(b, TE::F2, D(), k, j, i) * - (pack(b, te, var_t(), k, j - 1, i) - pack(b, te, var_t(), k, j, i)) / dx2; - if (j == jb.e) - pack.flux(b, X2DIR, var_t(), k, j + 1, i) = - pack(b, TE::F2, D(), k, j + 1, i) * - (pack(b, te, var_t(), k, j, i) - pack(b, te, var_t(), k, j + 1, i)) / - dx2; - } - - if (ndim > 2) { - Real dx3 = coords.template Dxc(k, j, i); - pack.flux(b, X3DIR, var_t(), k, j, i) = - pack(b, TE::F3, D(), k, j, i) * - (pack(b, te, var_t(), k - 1, j, i) - pack(b, te, var_t(), k, j, i)) / dx3; - if (k == kb.e) - pack.flux(b, X2DIR, var_t(), k + 1, j, i) = - pack(b, TE::F3, D(), k + 1, j, i) * - (pack(b, te, var_t(), k, j, i) - pack(b, te, var_t(), k + 1, j, i)) / - dx3; - } - }); - return TaskStatus::complete; - } - - template - static parthenon::TaskStatus - FluxMultiplyMatrix(std::shared_ptr> &md, bool only_interior) { - using namespace parthenon; - const int ndim = md->GetMeshPointer()->ndim; - using TE = parthenon::TopologicalElement; - TE te = TE::CC; - IndexRange ib = md->GetBoundsI(IndexDomain::interior, te); - IndexRange jb = md->GetBoundsJ(IndexDomain::interior, te); - IndexRange kb = md->GetBoundsK(IndexDomain::interior, te); - - auto pkg = md->GetMeshPointer()->packages.Get("poisson_package"); - const auto alpha = pkg->Param("diagonal_alpha"); - - int nblocks = md->NumBlocks(); - std::vector include_block(nblocks, true); - if (only_interior) { - for (int b = 0; b < nblocks; ++b) - include_block[b] = md->GetBlockData(b)->GetBlockPointer()->neighbors.size() == 0; - } - - if (only_md_level) { - for (int b = 0; b < nblocks; ++b) - include_block[b] = - include_block[b] && (md->grid.logical_level == - md->GetBlockData(b)->GetBlockPointer()->loc.level()); - } - - auto desc = - parthenon::MakePackDescriptor(md.get(), {}, {PDOpt::WithFluxes}); - auto pack = desc.GetPack(md.get(), include_block); - parthenon::par_for( - DEFAULT_LOOP_PATTERN, "FluxMultiplyMatrix", DevExecSpace(), 0, - pack.GetNBlocks() - 1, kb.s, kb.e, jb.s, jb.e, ib.s, ib.e, - KOKKOS_LAMBDA(const int b, const int k, const int j, const int i) { - const auto &coords = pack.GetCoordinates(b); - Real dx1 = coords.template Dxc(k, j, i); - pack(b, te, out_t(), k, j, i) = -alpha * pack(b, te, in_t(), k, j, i); - pack(b, te, out_t(), k, j, i) += (pack.flux(b, X1DIR, in_t(), k, j, i) - - pack.flux(b, X1DIR, in_t(), k, j, i + 1)) / - dx1; - - if (ndim > 1) { - Real dx2 = coords.template Dxc(k, j, i); - pack(b, te, out_t(), k, j, i) += (pack.flux(b, X2DIR, in_t(), k, j, i) - - pack.flux(b, X2DIR, in_t(), k, j + 1, i)) / - dx2; - } - - if (ndim > 2) { - Real dx3 = coords.template Dxc(k, j, i); - pack(b, te, out_t(), k, j, i) += (pack.flux(b, X3DIR, in_t(), k, j, i) - - pack.flux(b, X3DIR, in_t(), k + 1, j, i)) / - dx3; - } - }); - return TaskStatus::complete; - } -}; - } // namespace poisson_package #endif // EXAMPLE_POISSON_GMG_POISSON_PACKAGE_HPP_ diff --git a/src/solvers/mg_solver.hpp b/src/solvers/mg_solver.hpp index 824fa888ae97..9856890cb886 100644 --- a/src/solvers/mg_solver.hpp +++ b/src/solvers/mg_solver.hpp @@ -128,7 +128,6 @@ class MGSolver { int GetCurrentIterations() const { return iter_counter; } Real GetFinalResidual() const { return final_residual; } int GetFinalIterations() const { return final_iteration; } - protected: MGParams params_; int iter_counter; @@ -136,7 +135,9 @@ class MGSolver { equations eqs_; Real final_residual; int final_iteration; - + // These functions apparently have to be public to compile with cuda since + // they contain device side lambdas + public: enum class GSType { all, red, black }; template ndim; bool multilevel = (level != min_level); TaskID last_task;