amrex/doxygen/AMReX__MLNodeTensorLap__2D__K_8H_source.html

#ifndef AMREX_MLNODETENSORLAP_2D_K_H_

#define AMREX_MLNODETENSORLAP_2D_K_H_

#include <AMReX_Config.H>


namespace amrex {


namespace mlndts_detail {

    /**
     * Arithmetic mean of the coarse values at (ic,jc) and (ic+1,jc),
     * i.e. the value halfway between two coarse nodes adjacent in x.
     * Only component 0 (third index 0) of crse is read.
     */
    AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
    Real ts_interp_line_x (Array4<Real const> const& crse, int ic, int jc) noexcept
    {
        Real const at_lo = crse(ic  ,jc,0);
        Real const at_hi = crse(ic+1,jc,0);
        return (at_lo + at_hi) * Real(0.5);
    }

    /**
     * Arithmetic mean of the coarse values at (ic,jc) and (ic,jc+1),
     * i.e. the value halfway between two coarse nodes adjacent in y.
     * Only component 0 (third index 0) of crse is read.
     */
    AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
    Real ts_interp_line_y (Array4<Real const> const& crse, int ic, int jc) noexcept
    {
        Real const at_lo = crse(ic,jc  ,0);
        Real const at_hi = crse(ic,jc+1,0);
        return (at_lo + at_hi) * Real(0.5);
    }

    /**
     * Value at the center of the coarse cell whose lower corner is (ic,jc):
     * one quarter of the sum of the four edge-midpoint values produced by
     * ts_interp_line_y (at ic and ic+1) and ts_interp_line_x (at jc and jc+1).
     */
    AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
    Real ts_interp_face_xy (Array4<Real const> const& crse, int ic, int jc) noexcept
    {
        Real const edge_y_lo = ts_interp_line_y(crse,ic  ,jc  );
        Real const edge_y_hi = ts_interp_line_y(crse,ic+1,jc  );
        Real const edge_x_lo = ts_interp_line_x(crse,ic  ,jc  );
        Real const edge_x_hi = ts_interp_line_x(crse,ic  ,jc+1);
        // Left-to-right summation order is kept deliberately.
        return (edge_y_lo + edge_y_hi + edge_x_lo + edge_x_hi) * Real(0.25);
    }

} // namespace mlndts_detail


/**
 * Interpolate the coarse array crse to fine node (i,j) and add the result
 * to fine(i,j,0).  Nothing is done when msk(i,j,0) is nonzero.
 *
 * The coarse indices are obtained with amrex::coarsen(.,2).  Depending on
 * whether the fine index differs from twice the coarse index in x and/or y,
 * the added value is the cell-center average, an edge-midpoint average, or
 * the coarse node value itself.
 *
 * The third (unnamed) index argument is ignored; component/plane 0 is
 * always used.
 */
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
void mlndtslap_interpadd (int i, int j, int, Array4<Real> const& fine,
                          Array4<Real const> const& crse, Array4<int const> const& msk) noexcept
{
    using namespace mlndts_detail;

    // Masked nodes receive no correction.
    if (msk(i,j,0)) { return; }

    int const ic = amrex::coarsen(i,2);
    int const jc = amrex::coarsen(j,2);
    bool const between_in_x = (ic*2 != i);
    bool const between_in_y = (jc*2 != j);

    Real correction;
    if (between_in_x && between_in_y) {
        // Fine node sits in the interior of a coarse cell
        correction = ts_interp_face_xy(crse,ic,jc);
    } else if (between_in_x) {
        // Fine node sits on a coarse edge running in x
        correction = ts_interp_line_x(crse,ic,jc);
    } else if (between_in_y) {
        // Fine node sits on a coarse edge running in y
        correction = ts_interp_line_y(crse,ic,jc);
    } else {
        // Fine node coincides with a coarse node
        correction = crse(ic,jc,0);
    }

    fine(i,j,0) += correction;
}


/**
 * Variant of mlndtslap_interpadd for grids coarsened in one direction only.
 * Adds the interpolated coarse value to fine(i,j,0) unless msk(i,j,0) is
 * nonzero.
 *
 * When semi_dir == 0 the x index is used as-is on the coarse array and only
 * j is coarsened by 2; for any other semi_dir the y index is used as-is and
 * only i is coarsened by 2.
 *
 * The third (unnamed) index argument is ignored; component/plane 0 is
 * always used.
 */
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
void mlndtslap_semi_interpadd (int i, int j, int, Array4<Real> const& fine,
                               Array4<Real const> const& crse, Array4<int const> const& msk,
                               int semi_dir) noexcept
{
    using namespace mlndts_detail;

    // Masked nodes receive no correction.
    if (msk(i,j,0)) { return; }

    Real correction;
    if (semi_dir == 0) {
        int const jc = amrex::coarsen(j,2);
        // Odd j: midway between two coarse nodes in y; even j: on a coarse node.
        correction = (jc*2 != j) ? ts_interp_line_y(crse,i,jc)
                                 : crse(i,jc,0);
    } else {
        int const ic = amrex::coarsen(i,2);
        // Odd i: midway between two coarse nodes in x; even i: on a coarse node.
        correction = (ic*2 != i) ? ts_interp_line_x(crse,ic,j)
                                 : crse(ic,j,0);
    }

    fine(i,j,0) += correction;
}


/**
 * Apply the 9-point nodal stencil to x at node (i,j) and store the result
 * in y(i,j,k).  If msk(i,j,k) is nonzero, y(i,j,k) is set to zero instead.
 *
 * Stencil weights, as used below:
 *   - s[0] multiplies the two x-neighbors (i-1,j) and (i+1,j),
 *   - s[2] multiplies the two y-neighbors (i,j-1) and (i,j+1),
 *   - -2*(s[0]+s[2]) multiplies the center,
 *   - 0.5*s[1] multiplies the corner combination
 *     x(i-1,j-1) + x(i+1,j+1) - x(i-1,j+1) - x(i+1,j-1).
 *
 * x is always read with third index 0, while y and msk are indexed with k.
 */
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
void mlndtslap_adotx (int i, int j, int k, Array4<Real> const& y, Array4<Real const> const& x,
                      Array4<int const> const& msk, GpuArray<Real,3> const& s) noexcept
{
    if (msk(i,j,k)) {
        y(i,j,k) = Real(0.0);
        return;
    }

    Real const cx  = s[0];
    Real const cxy = s[1];
    Real const cy  = s[2];

    // Kept as one expression so the floating-point evaluation order is unchanged.
    y(i,j,k) = cx * (x(i-1,j,0) + x(i+1,j,0))
        +      cy * (x(i,j-1,0) + x(i,j+1,0))
        - Real(2.)*(cx+cy) * x(i,j,0)
        + Real(0.5)*cxy * (x(i-1,j-1,0) + x(i+1,j+1,0) - x(i-1,j+1,0) - x(i+1,j-1,0));
}


/**
 * Relax the solution at a single node (i,j) in place.
 *
 * If msk(i,j,k) is nonzero, sol(i,j,k) is set to zero.  Otherwise the
 * 9-point stencil (same weights as in mlndtslap_adotx) is evaluated on the
 * current contents of sol, and sol(i,j,k) is corrected by
 * (rhs - A*sol) * (omega / diag) with omega = 1.25 and
 * diag = -2*(s[0]+s[2]).
 *
 * Neighbor values of sol are read with third index 0; sol, rhs and msk at
 * the node itself are indexed with k.
 */
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
void mlndtslap_gauss_seidel (int i, int j, int k, Array4<Real> const& sol,
                             Array4<Real const> const& rhs, Array4<int const> const& msk,
                             GpuArray<Real,3> const& s) noexcept
{
    if (msk(i,j,k)) {
        sol(i,j,k) = Real(0.0);
        return;
    }

    constexpr Real relax = Real(1.25);   // relaxation factor
    Real const diag = Real(-2.)*(s[0]+s[2]); // stencil weight of the center node

    // Kept as one expression so the floating-point evaluation order is unchanged.
    Real const a_dot_sol = s[0] * (sol(i-1,j,0) + sol(i+1,j,0))
        +                  s[2] * (sol(i,j-1,0) + sol(i,j+1,0))
        + diag * sol(i,j,0)
        + Real(0.5)*s[1] * (sol(i-1,j-1,0) + sol(i+1,j+1,0) - sol(i-1,j+1,0) - sol(i+1,j-1,0));

    sol(i,j,k) += (rhs(i,j,k) - a_dot_sol) * (relax/diag);
}


#if defined(AMREX_USE_HYPRE) && (AMREX_SPACEDIM > 1)


/**
 * Fill sparse-matrix rows for all nodes of ndbx that have lid >= 0.
 *
 * For each such node, entries are appended contiguously to cols (column
 * ids taken from gid) and mat (stencil weights): the diagonal first, then
 * the eight neighbors in the order
 *   (i-1,j-1) (i,j-1) (i+1,j-1) (i-1,j) (i+1,j) (i-1,j+1) (i,j+1) (i+1,j+1).
 * A neighbor is skipped when its gid equals
 * std::numeric_limits<AtomicInt>::max().  The number of entries written for
 * the node is stored in ncols[lid(i,j,k)].
 *
 * Weights: -2*(s[0]+s[2]) on the diagonal, s[0] for x-neighbors, s[2] for
 * y-neighbors, +0.5*s[1] for the (-,-) and (+,+) corners and -0.5*s[1] for
 * the (+,-) and (-,+) corners.
 *
 * The caller must provide cols/mat/ncols buffers large enough for all rows
 * (sizes are not checked here).
 */
template <typename HypreInt, typename AtomicInt>
void mlndtslap_fill_ijmatrix_cpu (Box const& ndbx,
                                  Array4<AtomicInt const> const& gid,
                                  Array4<int const> const& lid,
                                  HypreInt* const ncols, HypreInt* const cols, Real* const mat, // NOLINT(readability-non-const-parameter)
                                  GpuArray<Real,3> const& s) noexcept
{
    constexpr auto gidmax = std::numeric_limits<AtomicInt>::max();

    // Off-diagonal stencil points, listed in the order they are emitted.
    struct StencilEntry { int di; int dj; Real coef; };
    StencilEntry const neighbors[] = {
        {-1, -1, Real( 0.5)*s[1]},
        { 0, -1, s[2]           },
        { 1, -1, Real(-0.5)*s[1]},
        {-1,  0, s[0]           },
        { 1,  0, s[0]           },
        {-1,  1, Real(-0.5)*s[1]},
        { 0,  1, s[2]           },
        { 1,  1, Real( 0.5)*s[1]}
    };

    HypreInt nelems = 0; // running write position in cols/mat

    amrex::LoopOnCpu(ndbx, [&] (int i, int j, int k) noexcept
    {
        // Nodes without a local id do not own a row.
        if (lid(i,j,k) < 0) { return; }

        HypreInt const row_begin = nelems;

        // Diagonal entry always comes first.
        cols[nelems] = gid(i,j,k);
        mat[nelems] = Real(-2.)*(s[0]+s[2]);
        ++nelems;

        for (auto const& nb : neighbors) {
            auto const g = gid(i+nb.di, j+nb.dj, k);
            if (g < gidmax) {
                cols[nelems] = g;
                mat[nelems] = nb.coef;
                ++nelems;
            }
        }

        ncols[lid(i,j,k)] = nelems - row_begin;
    });
}


#ifdef AMREX_USE_GPU

/**
 * Write one sparse-matrix entry for node (i,j,k), selected by offset, into
 * slot ps of cols/mat.  Does nothing when lid(i,j,k) < 0.
 *
 * offset == 0 : writes the diagonal entry (weight -2*(s[0]+s[2])) and also
 *               stores in ncols[lid(i,j,k)] the row length, i.e. 1 plus the
 *               number of the eight neighbors whose gid is below
 *               std::numeric_limits<AtomicInt>::max().
 * offset 1..8 : selects one neighbor, in the order
 *               (i-1,j-1) (i,j-1) (i+1,j-1) (i-1,j) (i+1,j)
 *               (i-1,j+1) (i,j+1) (i+1,j+1);
 *               the entry is written only if that neighbor's gid is below
 *               the maximum.  Weights are s[0] for x-neighbors, s[2] for
 *               y-neighbors, and +/-0.5*s[1] for corners.
 * any other offset: no effect.
 *
 * ps is supplied by the caller; how it is computed is not visible here.
 * The ndbx parameter is not used by this function.
 */
template <typename HypreInt, typename AtomicInt>
AMREX_GPU_DEVICE AMREX_FORCE_INLINE
void mlndtslap_fill_ijmatrix_gpu (const int ps, const int i, const int j, const int k,
                                  const int offset, Box const& ndbx,
                                  Array4<AtomicInt const> const& gid,
                                  Array4<int const> const& lid,
                                  HypreInt* const ncols, HypreInt* const cols, Real* const mat,
                                  GpuArray<Real,3> const& s) noexcept
{
    // Nodes without a local id do not own a row.
    if (lid(i,j,k) < 0) { return; }

    constexpr auto gidmax = std::numeric_limits<AtomicInt>::max();

    if (offset == 0) {
        cols[ps] = gid(i,j,k);
        mat[ps] = Real(-2.)*(s[0]+s[2]);

        // Row length: the diagonal plus every valid neighbor.
        int nc = 1;
        for (int dj = -1; dj <= 1; ++dj) {
            for (int di = -1; di <= 1; ++di) {
                if (di == 0 && dj == 0) { continue; }
                if (gid(i+di,j+dj,k) < gidmax) { ++nc; }
            }
        }
        ncols[lid(i,j,k)] = nc;
        return;
    }

    // Map offset to the neighbor displacement and its stencil weight.
    int di = 0;
    int dj = 0;
    Real coef = Real(0.0);
    switch (offset) {
        case 1: di = -1; dj = -1; coef = Real( 0.5)*s[1]; break;
        case 2: di =  0; dj = -1; coef = s[2];            break;
        case 3: di =  1; dj = -1; coef = Real(-0.5)*s[1]; break;
        case 4: di = -1; dj =  0; coef = s[0];            break;
        case 5: di =  1; dj =  0; coef = s[0];            break;
        case 6: di = -1; dj =  1; coef = Real(-0.5)*s[1]; break;
        case 7: di =  0; dj =  1; coef = s[2];            break;
        case 8: di =  1; dj =  1; coef = Real( 0.5)*s[1]; break;
        default: return; // not a stencil slot
    }

    auto const g = gid(i+di,j+dj,k);
    if (g < gidmax) {
        cols[ps] = g;
        mat[ps] = coef;
    }
}

#endif


#endif


}


#endif

AMREX_FORCE_INLINE
#define AMREX_FORCE_INLINE
Definition AMReX_Extension.H:119

AMREX_GPU_DEVICE
#define AMREX_GPU_DEVICE
Definition AMReX_GpuQualifiers.H:18

AMREX_GPU_HOST_DEVICE
#define AMREX_GPU_HOST_DEVICE
Definition AMReX_GpuQualifiers.H:20

offset
Array4< int const  > offset
Definition AMReX_HypreMLABecLap.cpp:1089

fine
Array4< Real > fine
Definition AMReX_InterpFaceRegister.cpp:90

crse
Array4< Real const  > crse
Definition AMReX_InterpFaceRegister.cpp:92

amrex::mlndts_detail::ts_interp_line_x
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE Real ts_interp_line_x(Array4< Real const > const &crse, int ic, int jc) noexcept
Definition AMReX_MLNodeTensorLap_2D_K.H:10

amrex::mlndts_detail::ts_interp_line_y
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE Real ts_interp_line_y(Array4< Real const > const &crse, int ic, int jc) noexcept
Definition AMReX_MLNodeTensorLap_2D_K.H:16

amrex::mlndts_detail::ts_interp_face_xy
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE Real ts_interp_face_xy(Array4< Real const > const &crse, int ic, int jc) noexcept
Definition AMReX_MLNodeTensorLap_2D_K.H:22

amrex
Definition AMReX_Amr.cpp:49

amrex::LoopOnCpu
AMREX_ATTRIBUTE_FLATTEN_FOR void LoopOnCpu(Dim3 lo, Dim3 hi, F const &f) noexcept
Definition AMReX_Loop.H:355

amrex::Box
BoxND< AMREX_SPACEDIM > Box
Definition AMReX_BaseFwd.H:27

amrex::CurlCurlStateType::x
@ x

amrex::mlndtslap_adotx
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void mlndtslap_adotx(int i, int j, int k, Array4< Real > const &y, Array4< Real const > const &x, Array4< int const > const &msk, GpuArray< Real, 3 > const &s) noexcept
Definition AMReX_MLNodeTensorLap_2D_K.H:91

amrex::mlndtslap_gauss_seidel
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void mlndtslap_gauss_seidel(int i, int j, int k, Array4< Real > const &sol, Array4< Real const > const &rhs, Array4< int const > const &msk, GpuArray< Real, 3 > const &s) noexcept
Definition AMReX_MLNodeTensorLap_2D_K.H:105

amrex::coarsen
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE BoxND< dim > coarsen(const BoxND< dim > &b, int ref_ratio) noexcept
Coarsen BoxND by given (positive) refinement ratio. NOTE: if type(dir) = CELL centered: lo <- lo/rati...
Definition AMReX_Box.H:1304

amrex::mlndtslap_semi_interpadd
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void mlndtslap_semi_interpadd(int, int, int, Array4< Real > const &, Array4< Real const > const &, Array4< int const > const &, int) noexcept
Definition AMReX_MLNodeTensorLap_1D_K.H:13

amrex::mlndtslap_interpadd
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE void mlndtslap_interpadd(int, int, int, Array4< Real > const &, Array4< Real const > const &, Array4< int const > const &) noexcept
Definition AMReX_MLNodeTensorLap_1D_K.H:8

amrex::Array4
Definition AMReX_Array4.H:61

amrex::GpuArray
Definition AMReX_Array.H:34