// docs_html/doxygen/AMReX__FabArrayUtility_8H_source.html

#ifndef AMREX_FABARRAY_UTILITY_H_

#define AMREX_FABARRAY_UTILITY_H_

#include <AMReX_Config.H>


#include <AMReX_Concepts.H>

#include <AMReX_FabArray.H>

#include <AMReX_LayoutData.H>

#include <AMReX_Print.H>

#include <AMReX_ParReduce.H>

#include <limits>


namespace amrex {


template <BaseFabType FAB, class F>

typename FAB::value_type


ReduceSum (FabArray<FAB> const& fa, int nghost, F&& f)

{

    return ReduceSum(fa, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB, class F>

typename FAB::value_type

ReduceSum_host (FabArray<FAB> const& fa, IntVect const& nghost, F const& f)

{

    using value_type = typename FAB::value_type;

    value_type sm = 0;


#ifdef AMREX_USE_OMP

#pragma omp parallel if (!system::regtest_reduction) reduction(+:sm)

#endif

    for (MFIter mfi(fa,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        auto const& arr = fa.const_array(mfi);

        sm += f(bx, arr);

    }


    return sm;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Reduction over one FabArray expressed through ParReduce.
 *
 * The result type is `int` when OP is ReduceOpLogicalAnd or ReduceOpLogicalOr,
 * and FAB::value_type otherwise. The device lambda handed to ParReduce calls
 * `f` on a single-cell box built from (i,j,k) with the index type of `fa`,
 * together with the array selected by the box number, and casts the result
 * to the result type.
 */
template <class OP, BaseFabType FAB, class F>
std::conditional_t<std::is_same_v<OP,ReduceOpLogicalAnd> ||
                   std::is_same_v<OP,ReduceOpLogicalOr>,
                   int, typename FAB::value_type>
ReduceMF (FabArray<FAB> const& fa, IntVect const& nghost, F const& f)
{
    using T = std::conditional_t<std::is_same_v<OP,ReduceOpLogicalAnd> ||
                                 std::is_same_v<OP,ReduceOpLogicalOr>,
                                 int, typename FAB::value_type>;

    // Both are captured by value in the device lambda below.
    auto idx_type = fa.ixType();
    auto const& arrays = fa.const_arrays();

    return ParReduce(TypeList<OP>{}, TypeList<T>{}, fa, nghost,
           [=] AMREX_GPU_DEVICE (int ibox, int i, int j, int k) noexcept -> GpuTuple<T>
           {
               return { static_cast<T>(f(amrex::makeSingleCellBox(i,j,k,idx_type),
                                         arrays[ibox])) };
           });
}


/**
 * \brief Reduction over two FabArrays expressed through ParReduce.
 *
 * The result type is `int` for ReduceOpLogicalAnd / ReduceOpLogicalOr and
 * FAB1::value_type otherwise. ParReduce is driven by `fa1`; the index type of
 * the single-cell box also comes from `fa1`. For each cell the device lambda
 * calls `f(box, array1, array2)` and casts the result to the result type.
 */
template <class OP, BaseFabType FAB1, BaseFabType FAB2, class F>
std::conditional_t<std::is_same_v<OP,ReduceOpLogicalAnd> ||
                   std::is_same_v<OP,ReduceOpLogicalOr>,
                   int, typename FAB1::value_type>
ReduceMF (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2, IntVect const& nghost, F const& f)
{
    using T = std::conditional_t<std::is_same_v<OP,ReduceOpLogicalAnd> ||
                                 std::is_same_v<OP,ReduceOpLogicalOr>,
                                 int, typename FAB1::value_type>;

    // All three are captured by value in the device lambda below.
    auto idx_type = fa1.ixType();
    auto const& arrays1 = fa1.const_arrays();
    auto const& arrays2 = fa2.const_arrays();

    return ParReduce(TypeList<OP>{}, TypeList<T>{}, fa1, nghost,
           [=] AMREX_GPU_DEVICE (int ibox, int i, int j, int k) noexcept -> GpuTuple<T>
           {
               return { static_cast<T>(f(amrex::makeSingleCellBox(i,j,k,idx_type),
                                         arrays1[ibox], arrays2[ibox])) };
           });
}


/**
 * \brief Reduction over three FabArrays expressed through ParReduce.
 *
 * The result type is `int` for ReduceOpLogicalAnd / ReduceOpLogicalOr and
 * FAB1::value_type otherwise. ParReduce is driven by `fa1`; the index type of
 * the single-cell box also comes from `fa1`. For each cell the device lambda
 * calls `f(box, array1, array2, array3)` and casts the result to the result type.
 */
template <class OP, BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>
std::conditional_t<std::is_same_v<OP,ReduceOpLogicalAnd> ||
                   std::is_same_v<OP,ReduceOpLogicalOr>,
                   int, typename FAB1::value_type>
ReduceMF (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
          FabArray<FAB3> const& fa3, IntVect const& nghost, F const& f)
{
    using T = std::conditional_t<std::is_same_v<OP,ReduceOpLogicalAnd> ||
                                 std::is_same_v<OP,ReduceOpLogicalOr>,
                                 int, typename FAB1::value_type>;

    // All four are captured by value in the device lambda below.
    auto idx_type = fa1.ixType();
    auto const& arrays1 = fa1.const_arrays();
    auto const& arrays2 = fa2.const_arrays();
    auto const& arrays3 = fa3.const_arrays();

    return ParReduce(TypeList<OP>{}, TypeList<T>{}, fa1, nghost,
           [=] AMREX_GPU_DEVICE (int ibox, int i, int j, int k) noexcept -> GpuTuple<T>
           {
               return { static_cast<T>(f(amrex::makeSingleCellBox(i,j,k,idx_type),
                                         arrays1[ibox], arrays2[ibox], arrays3[ibox])) };
           });
}


/**
 * \brief Host fallback for ReduceSum (one FabArray) when `f` may run on the host.
 *
 * Participates in overload resolution only when
 * DefinitelyNotHostRunnable<F>::value is false; simply forwards to ReduceSum_host.
 */
template <BaseFabType FAB, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceSum_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)
    -> typename FAB::value_type
{
    return ReduceSum_host(fa, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceSum (one FabArray) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. No reduction is
 * attempted: the arguments are marked unused and amrex::Abort is called.
 */
template <BaseFabType FAB, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceSum_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)
    -> typename FAB::value_type
{
    amrex::ignore_unused(fa, nghost, f);
    amrex::Abort("ReduceSum: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return 0;
}

}


template <BaseFabType FAB, class F>

typename FAB::value_type


ReduceSum (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpSum>(fa, nghost, std::forward<F>(f));

    } else {

        return fudetail::ReduceSum_host_wrapper(fa, nghost, std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB, class F>

typename FAB::value_type

ReduceSum (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    return fudetail::ReduceSum_host(fa, nghost, std::forward<F>(f));

}

#endif


template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type


ReduceSum (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           int nghost, F&& f)

{

    return ReduceSum(fa1, fa2, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type

ReduceSum_host (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                IntVect const& nghost, F const& f)

{

    using value_type = typename FAB1::value_type;

    value_type sm = 0;


#ifdef AMREX_USE_OMP

#pragma omp parallel if (!system::regtest_reduction) reduction(+:sm)

#endif

    for (MFIter mfi(fa1,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr1 = fa1.const_array(mfi);

        const auto& arr2 = fa2.const_array(mfi);

        sm += f(bx, arr1, arr2);

    }


    return sm;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceSum (two FabArrays) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * ReduceSum_host.
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceSum_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    return ReduceSum_host(fa1, fa2, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceSum (two FabArrays) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceSum_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    amrex::ignore_unused(fa1, fa2, nghost, f);
    amrex::Abort("ReduceSum: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return 0;
}

}


template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type


ReduceSum (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpSum>(fa1,fa2,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceSum_host_wrapper(fa1,fa2,nghost, std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type

ReduceSum (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           IntVect const& nghost, F&& f)

{

    return fudetail::ReduceSum_host(fa1,fa2,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type


ReduceSum (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2, FabArray<FAB3> const& fa3,

           int nghost, F&& f)

{

  return ReduceSum(fa1, fa2, fa3, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type

ReduceSum_host (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                FabArray<FAB3> const& fa3, IntVect const& nghost, F const& f)

{

    using value_type = typename FAB1::value_type;

    value_type sm = 0;


#ifdef AMREX_USE_OMP

#pragma omp parallel if (!system::regtest_reduction) reduction(+:sm)

#endif

    for (MFIter mfi(fa1,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr1 = fa1.const_array(mfi);

        const auto& arr2 = fa2.const_array(mfi);

        const auto& arr3 = fa3.const_array(mfi);

        sm += f(bx, arr1, arr2, arr3);

    }


    return sm;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceSum (three FabArrays) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * fudetail::ReduceSum_host.
 */
template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceSum_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    return fudetail::ReduceSum_host(fa1, fa2, fa3, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceSum (three FabArrays) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceSum_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    amrex::ignore_unused(fa1, fa2, fa3, nghost, f);
    amrex::Abort("ReduceSum: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return 0;
}

}


template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type


ReduceSum (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpSum>(fa1,fa2,fa3,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceSum_host_wrapper(fa1,fa2,fa3,nghost,std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type

ReduceSum (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)

{

    return fudetail::ReduceSum_host(fa1,fa2,fa3,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB, class F>

typename FAB::value_type


ReduceMin (FabArray<FAB> const& fa, int nghost, F&& f)

{

    return ReduceMin(fa, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB, class F>

typename FAB::value_type

ReduceMin_host (FabArray<FAB> const& fa, IntVect const& nghost, F const& f)

{

    using value_type = typename FAB::value_type;

    value_type r = std::numeric_limits<value_type>::max();


#ifdef AMREX_USE_OMP

#pragma omp parallel reduction(min:r)

#endif

    for (MFIter mfi(fa,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr = fa.const_array(mfi);

        r = std::min(r, f(bx, arr));

    }

    return r;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceMin (one FabArray) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * ReduceMin_host.
 */
template <BaseFabType FAB, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMin_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)
    -> typename FAB::value_type
{
    return ReduceMin_host(fa, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceMin (one FabArray) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMin_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)
    -> typename FAB::value_type
{
    amrex::ignore_unused(fa, nghost, f);
    amrex::Abort("ReduceMin: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return 0;
}

}


template <BaseFabType FAB, class F>

typename FAB::value_type


ReduceMin (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpMin>(fa, nghost, std::forward<F>(f));

    } else {

        return fudetail::ReduceMin_host_wrapper(fa, nghost, std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB, class F>

typename FAB::value_type

ReduceMin (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    return fudetail::ReduceMin_host(fa, nghost, std::forward<F>(f));

}

#endif


template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type


ReduceMin (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2, int nghost, F&& f)

{

    return ReduceMin(fa1, fa2, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type

ReduceMin_host (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                IntVect const& nghost, F const& f)

{

    using value_type = typename FAB1::value_type;

    value_type r = std::numeric_limits<value_type>::max();


#ifdef AMREX_USE_OMP

#pragma omp parallel reduction(min:r)

#endif

    for (MFIter mfi(fa1,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr1 = fa1.const_array(mfi);

        const auto& arr2 = fa2.const_array(mfi);

        r = std::min(r, f(bx, arr1, arr2));

    }


    return r;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceMin (two FabArrays) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * fudetail::ReduceMin_host.
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMin_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    return fudetail::ReduceMin_host(fa1, fa2, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceMin (two FabArrays) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMin_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    amrex::ignore_unused(fa1, fa2, nghost, f);
    amrex::Abort("ReduceMin: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return 0;
}

}


template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type


ReduceMin (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpMin>(fa1,fa2,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceMin_host_wrapper(fa1,fa2,nghost,std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type

ReduceMin (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           IntVect const& nghost, F&& f)

{

    return fudetail::ReduceMin_host(fa1,fa2,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type


ReduceMin (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2, FabArray<FAB3> const& fa3,

           int nghost, F&& f)

{

    return ReduceMin(fa1, fa2, fa3, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type

ReduceMin_host (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                FabArray<FAB3> const& fa3, IntVect const& nghost, F const& f)

{

    using value_type = typename FAB1::value_type;

    value_type r = std::numeric_limits<value_type>::max();


#ifdef AMREX_USE_OMP

#pragma omp parallel reduction(min:r)

#endif

    for (MFIter mfi(fa1,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr1 = fa1.const_array(mfi);

        const auto& arr2 = fa2.const_array(mfi);

        const auto& arr3 = fa3.const_array(mfi);

        r = std::min(r, f(bx, arr1, arr2, arr3));

    }


    return r;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceMin (three FabArrays) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * fudetail::ReduceMin_host.
 */
template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMin_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    return fudetail::ReduceMin_host(fa1, fa2, fa3, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceMin (three FabArrays) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMin_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    amrex::ignore_unused(fa1, fa2, fa3, nghost, f);
    amrex::Abort("ReduceMin: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return 0;
}

}


template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type


ReduceMin (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpMin>(fa1,fa2,fa3,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceMin_host_wrapper(fa1,fa2,fa3,nghost,std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type

ReduceMin (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)

{

    return fudetail::ReduceMin_host(fa1,fa2,fa3,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB, class F>

typename FAB::value_type


ReduceMax (FabArray<FAB> const& fa, int nghost, F&& f)

{

    return ReduceMax(fa, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB, class F>

typename FAB::value_type

ReduceMax_host (FabArray<FAB> const& fa, IntVect const& nghost, F const& f)

{

    using value_type = typename FAB::value_type;

    value_type r = std::numeric_limits<value_type>::lowest();


#ifdef AMREX_USE_OMP

#pragma omp parallel reduction(max:r)

#endif

    for (MFIter mfi(fa,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr = fa.const_array(mfi);

        r = std::max(r, f(bx, arr));

    }


    return r;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceMax (one FabArray) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * ReduceMax_host.
 */
template <BaseFabType FAB, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMax_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)
    -> typename FAB::value_type
{
    return ReduceMax_host(fa, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceMax (one FabArray) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMax_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)
    -> typename FAB::value_type
{
    amrex::ignore_unused(fa, nghost, f);
    amrex::Abort("ReduceMax: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return 0;
}

}


template <BaseFabType FAB, class F>

typename FAB::value_type


ReduceMax (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpMax>(fa,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceMax_host_wrapper(fa,nghost,std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB, class F>

typename FAB::value_type

ReduceMax (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    return fudetail::ReduceMax_host(fa,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type


ReduceMax (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2, int nghost, F&& f)

{

    return ReduceMax(fa1, fa2, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type

ReduceMax_host (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                IntVect const& nghost, F const& f)

{

    using value_type = typename FAB1::value_type;

    value_type r = std::numeric_limits<value_type>::lowest();


#ifdef AMREX_USE_OMP

#pragma omp parallel reduction(max:r)

#endif

    for (MFIter mfi(fa1,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr1 = fa1.const_array(mfi);

        const auto& arr2 = fa2.const_array(mfi);

        r = std::max(r, f(bx, arr1, arr2));

    }


    return r;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceMax (two FabArrays) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * ReduceMax_host.
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMax_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    return ReduceMax_host(fa1, fa2, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceMax (two FabArrays) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMax_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    amrex::ignore_unused(fa1, fa2, nghost, f);
    amrex::Abort("ReduceMax: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return 0;
}

}


template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type


ReduceMax (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpMax>(fa1,fa2,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceMax_host_wrapper(fa1,fa2,nghost,std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB1, BaseFabType FAB2, class F>

typename FAB1::value_type

ReduceMax (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           IntVect const& nghost, F&& f)

{

    return fudetail::ReduceMax_host(fa1,fa2,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type


ReduceMax (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2, FabArray<FAB3> const& fa3,

           int nghost, F&& f)

{

    return ReduceMax(fa1, fa2, fa3, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type

ReduceMax_host (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                FabArray<FAB3> const& fa3, IntVect const& nghost, F const& f)

{

    using value_type = typename FAB1::value_type;

    value_type r = std::numeric_limits<value_type>::lowest();


#ifdef AMREX_USE_OMP

#pragma omp parallel reduction(max:r)

#endif

    for (MFIter mfi(fa1,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr1 = fa1.const_array(mfi);

        const auto& arr2 = fa2.const_array(mfi);

        const auto& arr3 = fa3.const_array(mfi);

        r = std::max(r, f(bx, arr1, arr2, arr3));

    }


    return r;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceMax (three FabArrays) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * fudetail::ReduceMax_host.
 */
template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMax_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    return fudetail::ReduceMax_host(fa1, fa2, fa3, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceMax (three FabArrays) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceMax_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                             FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)
    -> typename FAB1::value_type
{
    amrex::ignore_unused(fa1, fa2, fa3, nghost, f);
    amrex::Abort("ReduceMax: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return 0;
}

}


template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type


ReduceMax (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpMax>(fa1,fa2,fa3,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceMax_host_wrapper(fa1,fa2,fa3,nghost,std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB1, BaseFabType FAB2, BaseFabType FAB3, class F>

typename FAB1::value_type

ReduceMax (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

           FabArray<FAB3> const& fa3, IntVect const& nghost, F&& f)

{

    return fudetail::ReduceMax_host(fa1,fa2,fa3,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB, class F>

bool


ReduceLogicalAnd (FabArray<FAB> const& fa, int nghost, F&& f)

{

    return ReduceLogicalAnd(fa, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB, class F>

bool

ReduceLogicalAnd_host (FabArray<FAB> const& fa, IntVect const& nghost, F const& f)

{

    int r = true;


#ifdef AMREX_USE_OMP

#pragma omp parallel reduction(&&:r)

#endif

    for (MFIter mfi(fa,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr = fa.const_array(mfi);

        r = r && f(bx, arr);

    }


    return r;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceLogicalAnd (one FabArray) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * ReduceLogicalAnd_host.
 */
template <BaseFabType FAB, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceLogicalAnd_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f) -> bool
{
    return ReduceLogicalAnd_host(fa, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceLogicalAnd (one FabArray) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceLogicalAnd_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f) -> bool
{
    amrex::ignore_unused(fa, nghost, f);
    amrex::Abort("ReduceLogicalAnd: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return false;
}

}


template <BaseFabType FAB, class F>

bool


ReduceLogicalAnd (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpLogicalAnd>(fa,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceLogicalAnd_host_wrapper(fa,nghost,std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB, class F>

bool

ReduceLogicalAnd (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    return fudetail::ReduceLogicalAnd_host(fa,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB1, BaseFabType FAB2, class F>

bool


ReduceLogicalAnd (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                  int nghost, F&& f)

{

    return ReduceLogicalAnd(fa1, fa2, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB1, BaseFabType FAB2, class F>

bool

ReduceLogicalAnd_host (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                       IntVect const& nghost, F const& f)

{

    int r = true;


#ifdef AMREX_USE_OMP

#pragma omp parallel reduction(&&:r)

#endif

    for (MFIter mfi(fa1,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr1 = fa1.const_array(mfi);

        const auto& arr2 = fa2.const_array(mfi);

        r = r && f(bx, arr1, arr2);

    }


    return r;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceLogicalAnd (two FabArrays) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * ReduceLogicalAnd_host.
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceLogicalAnd_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                                    IntVect const& nghost, F&& f) -> bool
{
    return ReduceLogicalAnd_host(fa1, fa2, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceLogicalAnd (two FabArrays) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
bool ReduceLogicalAnd_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                                    IntVect const& nghost, F&& f)
{
    amrex::ignore_unused(fa1,fa2,nghost,f);
    // Message spelling fixed ("Luanch" -> "Launch") to match the sibling overloads.
    amrex::Abort("ReduceLogicalAnd: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return false;
}

}


template <BaseFabType FAB1, BaseFabType FAB2, class F>

bool


ReduceLogicalAnd (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                  IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpLogicalAnd>(fa1,fa2,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceLogicalAnd_host_wrapper(fa1,fa2,nghost,std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB1, BaseFabType FAB2, class F>

bool

ReduceLogicalAnd (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                  IntVect const& nghost, F&& f)

{

    return fudetail::ReduceLogicalAnd_host(fa1,fa2,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB, class F>

bool


ReduceLogicalOr (FabArray<FAB> const& fa, int nghost, F&& f)

{

    return ReduceLogicalOr(fa, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

template <BaseFabType FAB, class F>

bool

ReduceLogicalOr_host (FabArray<FAB> const& fa, IntVect const& nghost, F const& f)

{

    int r = false;


#ifdef AMREX_USE_OMP

#pragma omp parallel reduction(||:r)

#endif

    for (MFIter mfi(fa,true); mfi.isValid(); ++mfi)

    {

        const Box& bx = mfi.growntilebox(nghost);

        const auto& arr = fa.const_array(mfi);

        r = r || f(bx, arr);

    }


    return r;

}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host fallback for ReduceLogicalOr (one FabArray) when `f` may run on the host.
 *
 * Enabled only when DefinitelyNotHostRunnable<F>::value is false; forwards to
 * ReduceLogicalOr_host.
 */
template <BaseFabType FAB, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
auto ReduceLogicalOr_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f) -> bool
{
    return ReduceLogicalOr_host(fa, nghost, std::forward<F>(f));
}


/**
 * \brief Host fallback for ReduceLogicalOr (one FabArray) when `f` cannot run on the host.
 *
 * Selected when DefinitelyNotHostRunnable<F>::value is true. Marks the
 * arguments unused and calls amrex::Abort instead of reducing.
 *
 * This overload was previously named ReduceLogicalOr_host. The public
 * ReduceLogicalOr calls fudetail::ReduceLogicalOr_host_wrapper, so under the
 * old name a functor that is definitely not host-runnable had no viable
 * single-FabArray wrapper overload. It now carries the `_host_wrapper` name
 * used by every sibling abort overload, and returns `false` like the other
 * bool-returning ones.
 */
template <BaseFabType FAB, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
bool ReduceLogicalOr_host_wrapper (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)
{
    amrex::ignore_unused(fa,nghost,f);
    amrex::Abort("ReduceLogicalOr: Launch Region is off. Device lambda cannot be called by host.");
    // Keeps the function well-formed; presumably not reached after Abort.
    return false;
}

}


template <BaseFabType FAB, class F>

bool


ReduceLogicalOr (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    if (Gpu::inLaunchRegion()) {

        return fudetail::ReduceMF<ReduceOpLogicalOr>(fa,nghost,std::forward<F>(f));

    } else {

        return fudetail::ReduceLogicalOr_host_wrapper(fa,nghost,std::forward<F>(f));

    }

}


#else

template <BaseFabType FAB, class F>

bool

ReduceLogicalOr (FabArray<FAB> const& fa, IntVect const& nghost, F&& f)

{

    return fudetail::ReduceLogicalOr_host(fa,nghost,std::forward<F>(f));

}

#endif


template <BaseFabType FAB1, BaseFabType FAB2, class F>

bool


ReduceLogicalOr (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,

                 int nghost, F&& f)

{

    return ReduceLogicalOr(fa1, fa2, IntVect(nghost), std::forward<F>(f));

}


namespace fudetail {

/**
 * \brief Host implementation of the two-FabArray logical-OR reduction.
 *
 * Iterates over the tiles of fa1 (tiling enabled), grows each tile box by
 * nghost, and ORs together the values f returns for the tile box and the
 * const arrays of fa1 and fa2. With AMREX_USE_OMP the loop sits in an OpenMP
 * parallel region with a `||` reduction on the accumulator.
 *
 * \param fa1    FabArray that drives the iteration
 * \param fa2    second FabArray, indexed with the same iterator
 * \param nghost ghost-cell extent used for growntilebox
 * \param f      callable invoked as f(box, array1, array2)
 * \return the accumulated value converted to bool
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
bool
ReduceLogicalOr_host (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                      IntVect const& nghost, F const& f)
{
    int found = false;

#ifdef AMREX_USE_OMP
#pragma omp parallel reduction(||:found)
#endif
    for (MFIter mfi(fa1,true); mfi.isValid(); ++mfi)
    {
        const Box& tile = mfi.growntilebox(nghost);
        const auto& a1 = fa1.const_array(mfi);
        const auto& a2 = fa2.const_array(mfi);
        // `||` short-circuits, so f is not called once found is already set.
        found = found || f(tile, a1, a2);
    }

    return found;
}

}


#ifdef AMREX_USE_GPU

namespace fudetail {

/**
 * \brief Host-side entry for the two-FabArray ReduceLogicalOr when F is not
 *        flagged as "definitely not host runnable".
 *
 * Forwards to fudetail::ReduceLogicalOr_host.
 *
 * \param fa1    first FabArray
 * \param fa2    second FabArray
 * \param nghost ghost-cell extent forwarded to the host implementation
 * \param f      callable forwarded to the host implementation
 * \return the value returned by fudetail::ReduceLogicalOr_host
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (!amrex::DefinitelyNotHostRunnable<F>::value)
bool ReduceLogicalOr_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                                   IntVect const& nghost, F&& f)
{
    return fudetail::ReduceLogicalOr_host(fa1,fa2,nghost,std::forward<F>(f));
}

/**
 * \brief Host-side entry for the two-FabArray ReduceLogicalOr when F
 *        satisfies DefinitelyNotHostRunnable.
 *
 * The callable cannot be invoked here, so this overload aborts with an error
 * message; the trailing return only exists to satisfy the signature.
 *
 * \param fa1    unused
 * \param fa2    unused
 * \param nghost unused
 * \param f      unused
 * \return false (after amrex::Abort has been called)
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
requires (amrex::DefinitelyNotHostRunnable<F>::value)
bool ReduceLogicalOr_host_wrapper (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                                   IntVect const& nghost, F&& f)
{
    amrex::ignore_unused(fa1,fa2,nghost,f);
    amrex::Abort("ReduceLogicalOr: Launch Region is off. Device lambda cannot be called by host.");
    return false;
}

}


/**
 * \brief Two-FabArray logical-OR reduction (GPU-enabled build).
 *
 * Chooses the implementation from Gpu::inLaunchRegion(): inside a launch
 * region the work goes to fudetail::ReduceMF<ReduceOpLogicalOr>, otherwise to
 * fudetail::ReduceLogicalOr_host_wrapper.
 *
 * \param fa1    first FabArray
 * \param fa2    second FabArray
 * \param nghost ghost-cell extent passed on to the chosen implementation
 * \param f      callable passed on to the chosen implementation
 * \return the reduction result converted to bool
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
bool
ReduceLogicalOr (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                 IntVect const& nghost, F&& f)
{
    if (!Gpu::inLaunchRegion()) {
        return fudetail::ReduceLogicalOr_host_wrapper(fa1,fa2,nghost,std::forward<F>(f));
    }
    return fudetail::ReduceMF<ReduceOpLogicalOr>(fa1,fa2,nghost,std::forward<F>(f));
}


#else

/**
 * \brief Two-FabArray logical-OR reduction (build without GPU support).
 *
 * Always delegates to fudetail::ReduceLogicalOr_host.
 *
 * \param fa1    first FabArray
 * \param fa2    second FabArray
 * \param nghost ghost-cell extent passed on to the host implementation
 * \param f      callable passed on to the host implementation
 * \return the host reduction result
 */
template <BaseFabType FAB1, BaseFabType FAB2, class F>
bool
ReduceLogicalOr (FabArray<FAB1> const& fa1, FabArray<FAB2> const& fa2,
                 IntVect const& nghost, F&& f)
{
    bool const any_true = fudetail::ReduceLogicalOr_host(fa1,fa2,nghost,std::forward<F>(f));
    return any_true;
}

#endif


/**
 * \brief Print the value(s) stored at one cell of a FabArray.
 *
 * For every local box whose valid region grown by ng contains the cell, the
 * requested values are copied into a pinned buffer and printed through
 * amrex::AllPrint() with 17 digits of precision.
 *
 * \param mf   FabArray to inspect
 * \param cell index of the cell to print
 * \param comp component to print; a negative value prints all components as a
 *             comma-separated list
 * \param ng   amount by which each valid box is grown before the containment test
 */
template <BaseFabType FAB>
void
printCell (FabArray<FAB> const& mf, const IntVect& cell, int comp = -1,
           const IntVect& ng = IntVect::TheZeroVector())
{
    for (MFIter mfi(mf); mfi.isValid(); ++mfi)
    {
        const Box& grown = amrex::grow(mfi.validbox(), ng);
        if (!grown.contains(cell)) { continue; }

        int nvals = (comp >= 0) ? 1 : mf.nComp();
        auto const& arr = mf.const_array(mfi);
        Gpu::PinnedVector<typename FAB::value_type> staging(nvals);
        auto* out = staging.data();
        // Copies either the single requested component or all of them into
        // the staging buffer.
        auto fetch = [=] AMREX_GPU_HOST_DEVICE ()
            {
                if (comp >= 0) {
                    *out = arr(cell, comp);
                } else {
                    for (int c = 0; c < nvals; ++c) {
                        out[c] = arr(cell,c);
                    }
                }
            };

#ifdef AMREX_USE_GPU
        // Managed or device arenas: run the copy as a single device task and
        // wait for it before reading the buffer on the host.
        if (mf.arena()->isManaged() || mf.arena()->isDevice()) {
            amrex::single_task(fetch);
            Gpu::streamSynchronize();
        } else
#endif
        {
            fetch();
        }

        if (comp >= 0) {
            amrex::AllPrint().SetPrecision(17) << " At cell " << cell << " in Box " << grown
                                               << ": " << *out << '\n';
        } else {
            std::ostringstream line;
            line.precision(17);
            const int last = nvals-1;
            for (int c = 0; c < last; ++c)
            {
                line << out[c] << ", ";
            }
            line << out[last];
            amrex::AllPrint() << " At cell " << cell << " in Box " << grown
                              << ": " << line.view() << '\n';
        }
    }
}


/**
 * \brief Swap components of two FabArrays, with a scalar ghost-cell count.
 *
 * Builds an IntVect from nghost and calls the IntVect overload of Swap.
 *
 * \param dst     first FabArray
 * \param src     second FabArray
 * \param srccomp first component in src
 * \param dstcomp first component in dst
 * \param numcomp number of components
 * \param nghost  scalar used to construct the IntVect ghost extent
 */
template <BaseFabType FAB>
void
Swap (FabArray<FAB>& dst, FabArray<FAB>& src, int srccomp, int dstcomp, int numcomp, int nghost)
{
    const IntVect ng(nghost);
    Swap(dst, src, srccomp, dstcomp, numcomp, ng);
}


/**
 * \brief Swap numcomp components between two FabArrays.
 *
 * When the request covers all of the data (both start components are 0,
 * numcomp equals the component count of both arrays, nghost equals the ghost
 * extent of both arrays) and both arrays use the same arena and agree on
 * hasEBFabFactory(), the two FabArray objects are exchanged with std::swap.
 * Otherwise the values are swapped cell by cell over the boxes grown by
 * nghost.
 *
 * \param dst     first FabArray
 * \param src     second FabArray
 * \param srccomp first component in src
 * \param dstcomp first component in dst
 * \param numcomp number of components to swap
 * \param nghost  ghost-cell extent included in the swap
 */
template <BaseFabType FAB>
void
Swap (FabArray<FAB>& dst, FabArray<FAB>& src, int srccomp, int dstcomp, int numcomp, const IntVect& nghost)
{
    // We can take a shortcut and do a std::swap if we're swapping all of the data
    // and they are allocated in the same Arena.
    // "All of the data" includes the component count: without the numcomp
    // test a partial request would exchange every component.
    const bool whole_object_swap =
        srccomp == dstcomp && dstcomp == 0 &&
        src.nComp() == dst.nComp() && numcomp == src.nComp() &&
        src.nGrowVect() == nghost && src.nGrowVect() == dst.nGrowVect() &&
        src.arena() == dst.arena() && src.hasEBFabFactory() == dst.hasEBFabFactory();

    if (whole_object_swap) {

        std::swap(dst, src);

    } else {
#ifdef AMREX_USE_GPU
        if (Gpu::inLaunchRegion() && dst.isFusingCandidate()) {
            auto const& dstma = dst.arrays();
            auto const& srcma = src.arrays();
            ParallelFor(dst, nghost, numcomp,
            [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k, int n) noexcept
            {
                const auto tmp                 = dstma[box_no](i,j,k,n+dstcomp);
                dstma[box_no](i,j,k,n+dstcomp) = srcma[box_no](i,j,k,n+srccomp);
                srcma[box_no](i,j,k,n+srccomp) = tmp;
            });
            if (!Gpu::inNoSyncRegion()) {
                Gpu::streamSynchronize();
            }
        } else
#endif
        {
#ifdef AMREX_USE_OMP
#pragma omp parallel if (Gpu::notInLaunchRegion())
#endif
            for (MFIter mfi(dst,TilingIfNotGPU()); mfi.isValid(); ++mfi)
            {
                const Box& bx = mfi.growntilebox(nghost);
                if (bx.ok()) {
                    auto sfab = src.array(mfi);
                    auto dfab = dst.array(mfi);
                    AMREX_HOST_DEVICE_PARALLEL_FOR_4D( bx, numcomp, i, j, k, n,
                    {
                        const auto tmp        = dfab(i,j,k,n+dstcomp);
                        dfab(i,j,k,n+dstcomp) = sfab(i,j,k,n+srccomp);
                        sfab(i,j,k,n+srccomp) = tmp;
                    });
                }
            }
        }
    }
}


/**
 * \brief dst -= src on selected components, with a scalar ghost-cell count.
 *
 * Builds an IntVect from nghost and calls the IntVect overload of Subtract.
 *
 * \param dst     FabArray that is modified
 * \param src     FabArray that is subtracted
 * \param srccomp first component in src
 * \param dstcomp first component in dst
 * \param numcomp number of components
 * \param nghost  scalar used to construct the IntVect ghost extent
 */
template <BaseFabType FAB>
void
Subtract (FabArray<FAB>& dst, FabArray<FAB> const& src, int srccomp, int dstcomp, int numcomp, int nghost)
{
    const IntVect ng(nghost);
    Subtract(dst, src, srccomp, dstcomp, numcomp, ng);
}


/**
 * \brief Cell-wise dst(…, dstcomp+n) -= src(…, srccomp+n) for n in [0, numcomp).
 *
 * In a GPU build, when Gpu::inLaunchRegion() is true and dst is a fusing
 * candidate, a single ParallelFor over all boxes is used (followed by a
 * stream synchronize unless inside a no-sync region). Otherwise the tiles of
 * dst are visited with an MFIter, each grown by nghost.
 *
 * \param dst     FabArray that is modified
 * \param src     FabArray that is subtracted
 * \param srccomp first component in src
 * \param dstcomp first component in dst
 * \param numcomp number of components
 * \param nghost  ghost-cell extent included in the operation
 */
template <BaseFabType FAB>
void
Subtract (FabArray<FAB>& dst, FabArray<FAB> const& src, int srccomp, int dstcomp, int numcomp, const IntVect& nghost)
{
#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion() && dst.isFusingCandidate()) {
        auto const& d_arrs = dst.arrays();
        auto const& s_arrs = src.const_arrays();
        ParallelFor(dst, nghost, numcomp,
        [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k, int n) noexcept
        {
            d_arrs[box_no](i,j,k,n+dstcomp) -= s_arrs[box_no](i,j,k,n+srccomp);
        });
        if (!Gpu::inNoSyncRegion()) {
            Gpu::streamSynchronize();
        }
        return;
    }
#endif

#ifdef AMREX_USE_OMP
#pragma omp parallel if (Gpu::notInLaunchRegion())
#endif
    for (MFIter mfi(dst,TilingIfNotGPU()); mfi.isValid(); ++mfi)
    {
        const Box& tile = mfi.growntilebox(nghost);
        if (!tile.ok()) { continue; }

        auto const s4 = src.array(mfi);
        auto       d4 = dst.array(mfi);
        AMREX_HOST_DEVICE_PARALLEL_FOR_4D( tile, numcomp, i, j, k, n,
        {
            d4(i,j,k,n+dstcomp) -= s4(i,j,k,n+srccomp);
        });
    }
}


/**
 * \brief dst *= src on selected components, with a scalar ghost-cell count.
 *
 * Builds an IntVect from nghost and calls the IntVect overload of Multiply.
 *
 * \param dst     FabArray that is modified
 * \param src     FabArray providing the factors
 * \param srccomp first component in src
 * \param dstcomp first component in dst
 * \param numcomp number of components
 * \param nghost  scalar used to construct the IntVect ghost extent
 */
template <BaseFabType FAB>
void
Multiply (FabArray<FAB>& dst, FabArray<FAB> const& src, int srccomp, int dstcomp, int numcomp, int nghost)
{
    const IntVect ng(nghost);
    Multiply(dst, src, srccomp, dstcomp, numcomp, ng);
}


/**
 * \brief Cell-wise dst(…, dstcomp+n) *= src(…, srccomp+n) for n in [0, numcomp).
 *
 * In a GPU build, when Gpu::inLaunchRegion() is true and dst is a fusing
 * candidate, a single ParallelFor over all boxes is used (followed by a
 * stream synchronize unless inside a no-sync region). Otherwise the tiles of
 * dst are visited with an MFIter, each grown by nghost.
 *
 * \param dst     FabArray that is modified
 * \param src     FabArray providing the factors
 * \param srccomp first component in src
 * \param dstcomp first component in dst
 * \param numcomp number of components
 * \param nghost  ghost-cell extent included in the operation
 */
template <BaseFabType FAB>
void
Multiply (FabArray<FAB>& dst, FabArray<FAB> const& src, int srccomp, int dstcomp, int numcomp, const IntVect& nghost)
{
#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion() && dst.isFusingCandidate()) {
        auto const& d_arrs = dst.arrays();
        auto const& s_arrs = src.const_arrays();
        ParallelFor(dst, nghost, numcomp,
        [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k, int n) noexcept
        {
            d_arrs[box_no](i,j,k,n+dstcomp) *= s_arrs[box_no](i,j,k,n+srccomp);
        });
        if (!Gpu::inNoSyncRegion()) {
            Gpu::streamSynchronize();
        }
        return;
    }
#endif

#ifdef AMREX_USE_OMP
#pragma omp parallel if (Gpu::notInLaunchRegion())
#endif
    for (MFIter mfi(dst,TilingIfNotGPU()); mfi.isValid(); ++mfi)
    {
        const Box& tile = mfi.growntilebox(nghost);
        if (!tile.ok()) { continue; }

        auto const s4 = src.array(mfi);
        auto       d4 = dst.array(mfi);
        AMREX_HOST_DEVICE_PARALLEL_FOR_4D( tile, numcomp, i, j, k, n,
        {
            d4(i,j,k,n+dstcomp) *= s4(i,j,k,n+srccomp);
        });
    }
}


/**
 * \brief dst /= src on selected components, with a scalar ghost-cell count.
 *
 * Builds an IntVect from nghost and calls the IntVect overload of Divide.
 *
 * \param dst     FabArray that is modified
 * \param src     FabArray providing the divisors
 * \param srccomp first component in src
 * \param dstcomp first component in dst
 * \param numcomp number of components
 * \param nghost  scalar used to construct the IntVect ghost extent
 */
template <BaseFabType FAB>
void
Divide (FabArray<FAB>& dst, FabArray<FAB> const& src, int srccomp, int dstcomp, int numcomp, int nghost)
{
    const IntVect ng(nghost);
    Divide(dst, src, srccomp, dstcomp, numcomp, ng);
}


/**
 * \brief Cell-wise dst(…, dstcomp+n) /= src(…, srccomp+n) for n in [0, numcomp).
 *
 * In a GPU build, when Gpu::inLaunchRegion() is true and dst is a fusing
 * candidate, a single ParallelFor over all boxes is used (followed by a
 * stream synchronize unless inside a no-sync region). Otherwise the tiles of
 * dst are visited with an MFIter, each grown by nghost. No check for zero
 * divisors is made here.
 *
 * \param dst     FabArray that is modified
 * \param src     FabArray providing the divisors
 * \param srccomp first component in src
 * \param dstcomp first component in dst
 * \param numcomp number of components
 * \param nghost  ghost-cell extent included in the operation
 */
template <BaseFabType FAB>
void
Divide (FabArray<FAB>& dst, FabArray<FAB> const& src, int srccomp, int dstcomp, int numcomp, const IntVect& nghost)
{
#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion() && dst.isFusingCandidate()) {
        auto const& d_arrs = dst.arrays();
        auto const& s_arrs = src.const_arrays();
        ParallelFor(dst, nghost, numcomp,
        [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k, int n) noexcept
        {
            d_arrs[box_no](i,j,k,n+dstcomp) /= s_arrs[box_no](i,j,k,n+srccomp);
        });
        if (!Gpu::inNoSyncRegion()) {
            Gpu::streamSynchronize();
        }
        return;
    }
#endif

#ifdef AMREX_USE_OMP
#pragma omp parallel if (Gpu::notInLaunchRegion())
#endif
    for (MFIter mfi(dst,TilingIfNotGPU()); mfi.isValid(); ++mfi)
    {
        const Box& tile = mfi.growntilebox(nghost);
        if (!tile.ok()) { continue; }

        auto const s4 = src.array(mfi);
        auto       d4 = dst.array(mfi);
        AMREX_HOST_DEVICE_PARALLEL_FOR_4D( tile, numcomp, i, j, k, n,
        {
            d4(i,j,k,n+dstcomp) /= s4(i,j,k,n+srccomp);
        });
    }
}


/**
 * \brief Replace selected components by their absolute value, with a scalar
 *        ghost-cell count.
 *
 * Builds an IntVect from nghost and calls the IntVect overload of Abs.
 *
 * \param fa      FabArray that is modified
 * \param icomp   first component
 * \param numcomp number of components
 * \param nghost  scalar used to construct the IntVect ghost extent
 */
template <BaseFabType FAB>
void
Abs (FabArray<FAB>& fa, int icomp, int numcomp, int nghost)
{
    const IntVect ng(nghost);
    Abs(fa, icomp, numcomp, ng);
}


/**
 * \brief Cell-wise fa(…, icomp+n) = std::abs(fa(…, icomp+n)) for n in [0, numcomp).
 *
 * In a GPU build, when Gpu::inLaunchRegion() is true and fa is a fusing
 * candidate, a single ParallelFor over all boxes is used (followed by a
 * stream synchronize unless inside a no-sync region). Otherwise the tiles of
 * fa are visited with an MFIter, each grown by nghost.
 *
 * \param fa      FabArray that is modified
 * \param icomp   first component
 * \param numcomp number of components
 * \param nghost  ghost-cell extent included in the operation
 */
template <BaseFabType FAB>
void
Abs (FabArray<FAB>& fa, int icomp, int numcomp, const IntVect& nghost)
{
#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion() && fa.isFusingCandidate()) {
        auto const& arrs = fa.arrays();
        ParallelFor(fa, nghost, numcomp,
        [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k, int n) noexcept
        {
            arrs[box_no](i,j,k,n+icomp) = std::abs(arrs[box_no](i,j,k,n+icomp));
        });
        if (!Gpu::inNoSyncRegion()) {
            Gpu::streamSynchronize();
        }
        return;
    }
#endif

#ifdef AMREX_USE_OMP
#pragma omp parallel if (Gpu::notInLaunchRegion())
#endif
    for (MFIter mfi(fa,TilingIfNotGPU()); mfi.isValid(); ++mfi)
    {
        const Box& tile = mfi.growntilebox(nghost);
        if (!tile.ok()) { continue; }

        auto const& a4 = fa.array(mfi);
        AMREX_HOST_DEVICE_PARALLEL_FOR_4D( tile, numcomp, i, j, k, n,
        {
            a4(i,j,k,n+icomp) = std::abs(a4(i,j,k,n+icomp));
        });
    }
}


/**
 * \brief Request a prefetch to the host for every local fab of fa.
 *
 * Only does work in a GPU build and only when fa's arena reports
 * isManaged(); otherwise the arguments are unused.
 *
 * \param fa          FabArray whose fabs are prefetched
 * \param synchronous value handed to MFItInfo::SetDeviceSync for the iteration
 */
template <BaseFabType FAB>
void
prefetchToHost (FabArray<FAB> const& fa, const bool synchronous = true)
{
#ifdef AMREX_USE_GPU
    if (!fa.arena()->isManaged()) { return; }

    for (MFIter mfi(fa, MFItInfo().SetDeviceSync(synchronous)); mfi.isValid(); ++mfi) {
        fa.prefetchToHost(mfi);
    }
#else
    amrex::ignore_unused(fa,synchronous);
#endif
}


/**
 * \brief Request a prefetch to the device for every local fab of fa.
 *
 * Only does work in a GPU build and only when fa's arena reports
 * isManaged(); otherwise the arguments are unused.
 *
 * \param fa          FabArray whose fabs are prefetched
 * \param synchronous value handed to MFItInfo::SetDeviceSync for the iteration
 */
template <BaseFabType FAB>
void
prefetchToDevice (FabArray<FAB> const& fa, const bool synchronous = true)
{
#ifdef AMREX_USE_GPU
    if (!fa.arena()->isManaged()) { return; }

    for (MFIter mfi(fa, MFItInfo().SetDeviceSync(synchronous)); mfi.isValid(); ++mfi) {
        fa.prefetchToDevice(mfi);
    }
#else
    amrex::ignore_unused(fa,synchronous);
#endif
}


/**
 * \brief Blocking override-sync: start the operation and complete it at once.
 *
 * Calls OverrideSync_nowait followed by OverrideSync_finish under the
 * profiler label "OverrideSync()".
 *
 * \param fa     FabArray that is synchronized in place
 * \param msk    mask FabArray forwarded to OverrideSync_nowait
 * \param period periodicity forwarded to OverrideSync_nowait
 */
template <BaseFabType FAB, BaseFabType IFAB>
void
OverrideSync (FabArray<FAB> & fa, FabArray<IFAB> const& msk, const Periodicity& period)
{
    BL_PROFILE("OverrideSync()");

    // Phase 1: mask and launch the communication.
    OverrideSync_nowait(fa, msk, period);
    // Phase 2: complete the communication and copy the result back.
    OverrideSync_finish(fa);
}


/**
 * \brief First half of the override-sync: mask the data and start the
 *        parallel copy.
 *
 * Does nothing for cell-centered data. Otherwise every value of fa whose mask
 * entry is zero is set to 0 (valid region only), a zero-filled temporary with
 * no ghost cells is created in fa.os_temp, and a non-blocking ParallelCopy of
 * fa into it is started with the ADD operation.
 *
 * Asserts that no override-sync is already pending on fa (fa.os_temp empty).
 *
 * \param fa     FabArray that is masked and used as the copy source
 * \param msk    mask FabArray; a zero entry clears the matching cell of fa
 * \param period periodicity used by the parallel copy
 */
template <BaseFabType FAB, BaseFabType IFAB>
void
OverrideSync_nowait (FabArray<FAB> & fa, FabArray<IFAB> const& msk, const Periodicity& period)
{
    BL_PROFILE("OverrideSync_nowait()");
    AMREX_ASSERT_WITH_MESSAGE(!fa.os_temp, "OverrideSync_nowait() called when already in progress.");

    if (fa.ixType().cellCentered()) { return; }

    const int nc = fa.nComp();

#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion() && fa.isFusingCandidate()) {
        auto const& data_arrs = fa.arrays();
        auto const& mask_arrs = msk.const_arrays();
        ParallelFor(fa, IntVect(0), nc,
        [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k, int n) noexcept
        {
            if (!mask_arrs[box_no](i,j,k)) { data_arrs[box_no](i,j,k,n) = 0; }
        });
        if (!Gpu::inNoSyncRegion()) {
            Gpu::streamSynchronize();
        }
    } else
#endif
    {
#ifdef AMREX_USE_OMP
#pragma omp parallel if (Gpu::notInLaunchRegion())
#endif
        for (MFIter mfi(fa,TilingIfNotGPU()); mfi.isValid(); ++mfi)
        {
            const Box& tile = mfi.tilebox();
            auto data4 = fa.array(mfi);
            auto const mask4 = msk.array(mfi);
            AMREX_HOST_DEVICE_PARALLEL_FOR_4D( tile, nc, i, j, k, n,
            {
                if (!mask4(i,j,k)) { data4(i,j,k,n) = 0; }
            });
        }
    }

    // Temporary that receives the summed contributions; kept on fa until
    // OverrideSync_finish consumes it.
    fa.os_temp = std::make_unique< FabArray<FAB> > ( fa.boxArray(), fa.DistributionMap(),
                                                     nc, 0, MFInfo(), fa.Factory() );
    fa.os_temp->setVal(0);
    fa.os_temp->ParallelCopy_nowait(fa, period, FabArrayBase::ADD);
}


/**
 * \brief Second half of the override-sync: finish the parallel copy and copy
 *        the result back.
 *
 * Does nothing for cell-centered data. Otherwise completes the copy pending
 * on fa.os_temp, copies all components of the temporary into fa (no ghost
 * cells), and releases the temporary.
 *
 * \param fa FabArray on which OverrideSync_nowait was called before
 */
template <BaseFabType FAB>
void
OverrideSync_finish (FabArray<FAB> & fa)
{
    BL_PROFILE("OverrideSync_finish()");

    if (fa.ixType().cellCentered()) { return; }

    auto& synced = *(fa.os_temp);
    synced.ParallelCopy_finish();
    amrex::Copy(fa, synced, 0, 0, fa.nComp(), 0);

    fa.os_temp.reset();
}


/**
 * \brief Copy ncomp components of src into dst, fab by fab.
 *
 * In a GPU build each fab is transferred with Gpu::dtoh_memcpy_async, using
 * the byte count of ncomp components over the fab box; this function does not
 * itself synchronize afterwards. Without GPU support it falls back to Copy
 * including all ghost cells of dst.
 *
 * Asserts that dst and src are MFIter-safe and have equal ghost extents.
 *
 * \param dst   destination FabArray
 * \param src   source FabArray
 * \param scomp first component in src
 * \param dcomp first component in dst
 * \param ncomp number of components
 */
template <BaseFabType FAB>
void
dtoh_memcpy (FabArray<FAB>& dst, FabArray<FAB> const& src,
             int scomp, int dcomp, int ncomp)
{
    AMREX_ASSERT(isMFIterSafe(dst, src));
    AMREX_ASSERT(dst.nGrowVect() == src.nGrowVect());
#ifdef AMREX_USE_GPU
    for (MFIter mfi(dst); mfi.isValid(); ++mfi) {
        void* to = dst[mfi].dataPtr(dcomp);
        void const* from = src[mfi].dataPtr(scomp);
        auto const nbytes = dst[mfi].nBytes(mfi.fabbox(), ncomp);
        Gpu::dtoh_memcpy_async(to, from, nbytes);
    }
#else
    Copy(dst, src, scomp, dcomp, ncomp, dst.nGrowVect());
#endif
}


/**
 * \brief Copy every component of src into dst via the component-range
 *        overload of dtoh_memcpy.
 *
 * \param dst destination FabArray; its component count sets the range
 * \param src source FabArray
 */
template <BaseFabType FAB>
void
dtoh_memcpy (FabArray<FAB>& dst, FabArray<FAB> const& src)
{
    const int first_comp = 0;
    dtoh_memcpy(dst, src, first_comp, first_comp, dst.nComp());
}


/**
 * \brief Copy ncomp components of src into dst, fab by fab.
 *
 * In a GPU build each fab is transferred with Gpu::htod_memcpy_async, using
 * the byte count of ncomp components over the fab box; this function does not
 * itself synchronize afterwards. Without GPU support it falls back to Copy
 * including all ghost cells of dst.
 *
 * Asserts that dst and src are MFIter-safe and have equal ghost extents.
 *
 * \param dst   destination FabArray
 * \param src   source FabArray
 * \param scomp first component in src
 * \param dcomp first component in dst
 * \param ncomp number of components
 */
template <BaseFabType FAB>
void
htod_memcpy (FabArray<FAB>& dst, FabArray<FAB> const& src,
             int scomp, int dcomp, int ncomp)
{
    AMREX_ASSERT(isMFIterSafe(dst, src));
    AMREX_ASSERT(dst.nGrowVect() == src.nGrowVect());
#ifdef AMREX_USE_GPU
    for (MFIter mfi(dst); mfi.isValid(); ++mfi) {
        void* to = dst[mfi].dataPtr(dcomp);
        void const* from = src[mfi].dataPtr(scomp);
        auto const nbytes = dst[mfi].nBytes(mfi.fabbox(), ncomp);
        Gpu::htod_memcpy_async(to, from, nbytes);
    }
#else
    Copy(dst, src, scomp, dcomp, ncomp, dst.nGrowVect());
#endif
}


/**
 * \brief Copy every component of src into dst via the component-range
 *        overload of htod_memcpy.
 *
 * \param dst destination FabArray; its component count sets the range
 * \param src source FabArray
 */
template <BaseFabType FAB>
void
htod_memcpy (FabArray<FAB>& dst, FabArray<FAB> const& src)
{
    const int first_comp = 0;
    htod_memcpy(dst, src, first_comp, first_comp, dst.nComp());
}


/**
 * \brief Find the index of a cell whose component comp equals value.
 *
 * The comparison is an exact `==`. If several cells match, which one is
 * reported depends on which thread claims the shared flag first. If no cell
 * matches, the returned IntVect is whatever `loc` was initialised with
 * (default-constructed on the host path, the zero-filled buffer on the GPU
 * path).
 *
 * \param mf     FabArray to search
 * \param comp   component to compare
 * \param nghost ghost-cell extent included in the search
 * \param value  value to look for
 * \return index of a matching cell on this process
 */
template <BaseFabType FAB>
IntVect
indexFromValue (FabArray<FAB> const& mf, int comp, IntVect const& nghost,
                typename FAB::value_type value)
{
    IntVect loc;

#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion())
    {
        amrex::Gpu::Buffer<int> flag_and_index({0,AMREX_D_DECL(0,0,0)});
        int* d_buf = flag_and_index.data();
        // This is a device ptr to 1+AMREX_SPACEDIM int zeros.
        // The first is used as an atomic bool and the others for intvect.
        if (mf.isFusingCandidate()) {
            auto const& arrs = mf.const_arrays();
            ParallelFor(mf, nghost, [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k) noexcept
            {
                int* claimed = d_buf;
                // Cheap read first, then the value test, then the atomic
                // exchange: only the thread that flips 0 -> 1 stores its index.
                if (*claimed == 0 &&
                    arrs[box_no](i,j,k,comp) == value &&
                    Gpu::Atomic::Exch(claimed,1) == 0)
                {
                    AMREX_D_TERM(d_buf[1] = i;,
                                 d_buf[2] = j;,
                                 d_buf[3] = k;);
                }
            });
        } else {
            for (MFIter mfi(mf,MFItInfo().SetDeviceSync(false)); mfi.isValid(); ++mfi) {
                const Box& grown = amrex::grow(mfi.validbox(), nghost);
                auto const& a4 = mf.const_array(mfi);
                amrex::ParallelFor(grown, [=] AMREX_GPU_DEVICE (int i, int j, int k) noexcept
                {
                    int* claimed = d_buf;
                    if (*claimed == 0 &&
                        a4(i,j,k,comp) == value &&
                        Gpu::Atomic::Exch(claimed,1) == 0)
                    {
                        AMREX_D_TERM(d_buf[1] = i;,
                                     d_buf[2] = j;,
                                     d_buf[3] = k;);
                    }
                });
            }
        }
        int const* h_buf = flag_and_index.copyToHost();
        AMREX_D_TERM(loc[0] = h_buf[1];,
                     loc[1] = h_buf[2];,
                     loc[2] = h_buf[3];);
    }
    else
#endif
    {
        bool found = false;
#ifdef AMREX_USE_OMP
#pragma omp parallel
#endif
        {
            // Per-thread candidate; TheMinVector() marks "nothing found yet".
            IntVect thread_loc = IntVect::TheMinVector();
            for (MFIter mfi(mf,true); mfi.isValid(); ++mfi)
            {
                const Box& tile = mfi.growntilebox(nghost);
                auto const& a4 = mf.const_array(mfi);
                AMREX_LOOP_3D(tile, i, j, k,
                {
                    if (a4(i,j,k,comp) == value) {
                        thread_loc = IntVect(AMREX_D_DECL(i,j,k));
                    }
                });
            }

            if (thread_loc.allGT(IntVect::TheMinVector())) {
                bool was_found;
// we should be able to test on _OPENMP < 201107 for capture (version 3.1)
// but we must work around a bug in gcc < 4.9
// And, with NVHPC 21.9 to <23.1, we saw an ICE with the atomic capture (NV bug: #3390723)
#if defined(AMREX_USE_OMP) && defined(_OPENMP) && (_OPENMP < 201307 || (defined(__NVCOMPILER) && __NVCOMPILER_MAJOR__ < 23)) // OpenMP 4.0
#pragma omp critical (amrex_indexfromvalue)
#elif defined(AMREX_USE_OMP)
#pragma omp atomic capture
#endif
                {
                    was_found = found;
                    found = true;
                }

                // Only the first thread to set the flag publishes its result.
                if (!was_found) { loc = thread_loc; }
            }
        }
    }

    return loc;
}


/**
 * \brief Sum over cells and components of x(…, xcomp+n) * y(…, ycomp+n).
 *
 * Asserts that x and y share BoxArray and DistributionMapping and have at
 * least nghost ghost cells.
 *
 * \param x      first FabArray
 * \param xcomp  first component in x
 * \param y      second FabArray
 * \param ycomp  first component in y
 * \param ncomp  number of components
 * \param nghost ghost-cell extent included in the sum
 * \param local  if false, the result is additionally sum-reduced over
 *               ParallelContext::CommunicatorSub()
 * \return the accumulated sum
 */
template <BaseFabType FAB>
typename FAB::value_type
Dot (FabArray<FAB> const& x, int xcomp, FabArray<FAB> const& y, int ycomp, int ncomp,
     IntVect const& nghost, bool local = false)
{
    BL_ASSERT(x.boxArray() == y.boxArray());
    BL_ASSERT(x.DistributionMap() == y.DistributionMap());
    BL_ASSERT(x.nGrowVect().allGE(nghost) && y.nGrowVect().allGE(nghost));

    BL_PROFILE("amrex::Dot()");

    using T = typename FAB::value_type;
    auto total = T(0.0);
#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion()) {
        auto const& x_arrs = x.const_arrays();
        auto const& y_arrs = y.const_arrays();
        total = ParReduce(TypeList<ReduceOpSum>{}, TypeList<T>{}, x, nghost,
        [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k) noexcept -> GpuTuple<T>
        {
            // Per-cell partial sum over the requested components.
            auto cell_sum = T(0.0);
            auto const& xa = x_arrs[box_no];
            auto const& ya = y_arrs[box_no];
            for (int n = 0; n < ncomp; ++n) {
                cell_sum += xa(i,j,k,xcomp+n) * ya(i,j,k,ycomp+n);
            }
            return cell_sum;
        });
    } else
#endif
    {
#ifdef AMREX_USE_OMP
#pragma omp parallel if (!system::regtest_reduction) reduction(+:total)
#endif
        for (MFIter mfi(x,true); mfi.isValid(); ++mfi)
        {
            Box const& tile = mfi.growntilebox(nghost);
            auto const& xa = x.const_array(mfi);
            auto const& ya = y.const_array(mfi);
            AMREX_LOOP_4D(tile, ncomp, i, j, k, n,
            {
                total += xa(i,j,k,xcomp+n) * ya(i,j,k,ycomp+n);
            });
        }
    }

    if (!local) {
        ParallelAllReduce::Sum(total, ParallelContext::CommunicatorSub());
    }

    return total;
}


/**
 * \brief Sum over cells and components of x(…, xcomp+n) squared.
 *
 * Asserts that x has at least nghost ghost cells.
 *
 * \param x      FabArray
 * \param xcomp  first component
 * \param ncomp  number of components
 * \param nghost ghost-cell extent included in the sum
 * \param local  if false, the result is additionally sum-reduced over
 *               ParallelContext::CommunicatorSub()
 * \return the accumulated sum
 */
template <BaseFabType FAB>
typename FAB::value_type
Dot (FabArray<FAB> const& x, int xcomp, int ncomp, IntVect const& nghost, bool local = false)
{
    BL_ASSERT(x.nGrowVect().allGE(nghost));

    BL_PROFILE("amrex::Dot()");

    using T = typename FAB::value_type;
    auto total = T(0.0);
#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion()) {
        auto const& x_arrs = x.const_arrays();
        total = ParReduce(TypeList<ReduceOpSum>{}, TypeList<T>{}, x, nghost,
        [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k) noexcept -> GpuTuple<T>
        {
            // Per-cell partial sum over the requested components.
            auto cell_sum = T(0.0);
            auto const& xa = x_arrs[box_no];
            for (int n = 0; n < ncomp; ++n) {
                auto val = xa(i,j,k,xcomp+n);
                cell_sum += val*val;
            }
            return cell_sum;
        });
    } else
#endif
    {
#ifdef AMREX_USE_OMP
#pragma omp parallel if (!system::regtest_reduction) reduction(+:total)
#endif
        for (MFIter mfi(x,true); mfi.isValid(); ++mfi)
        {
            Box const& tile = mfi.growntilebox(nghost);
            auto const& xa = x.const_array(mfi);
            AMREX_LOOP_4D(tile, ncomp, i, j, k, n,
            {
                auto val = xa(i,j,k,xcomp+n);
                total += val*val;
            });
        }
    }

    if (!local) {
        ParallelAllReduce::Sum(total, ParallelContext::CommunicatorSub());
    }

    return total;
}


/**
 * \brief Mask-weighted sum over cells and components of
 *        mask * x(…, xcomp+n) * y(…, ycomp+n).
 *
 * The mask value of each cell is converted to the value type of FAB and used
 * as a multiplicative weight. Asserts that mask, x and y share BoxArray and
 * DistributionMapping and have at least nghost ghost cells.
 *
 * \param mask   FabArray of per-cell weights (first component is read)
 * \param x      first FabArray
 * \param xcomp  first component in x
 * \param y      second FabArray
 * \param ycomp  first component in y
 * \param ncomp  number of components
 * \param nghost ghost-cell extent included in the sum
 * \param local  if false, the result is additionally sum-reduced over
 *               ParallelContext::CommunicatorSub()
 * \return the accumulated sum
 */
template <BaseFabType IFAB, BaseFabType FAB>
typename FAB::value_type
Dot (FabArray<IFAB> const& mask, FabArray<FAB> const& x, int xcomp,
     FabArray<FAB> const& y, int ycomp, int ncomp, IntVect const& nghost,
     bool local = false)
{
    BL_ASSERT(x.boxArray() == y.boxArray() && x.boxArray() == mask.boxArray());
    BL_ASSERT(x.DistributionMap() == y.DistributionMap() && x.DistributionMap() == mask.DistributionMap());
    BL_ASSERT(x.nGrowVect().allGE(nghost) && y.nGrowVect().allGE(nghost) &&
              mask.nGrowVect().allGE(nghost));

    BL_PROFILE("amrex::Dot()");

    using T = typename FAB::value_type;
    auto total = T(0.0);
#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion()) {
        auto const& m_arrs = mask.const_arrays();
        auto const& x_arrs = x.const_arrays();
        auto const& y_arrs = y.const_arrays();
        total = ParReduce(TypeList<ReduceOpSum>{}, TypeList<T>{}, x, nghost,
        [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k) noexcept -> GpuTuple<T>
        {
            auto cell_sum = T(0.0);
            auto weight = T(m_arrs[box_no](i,j,k));
            // Skip the component loop entirely for zero-weight cells.
            if (weight != 0) {
                auto const& xa = x_arrs[box_no];
                auto const& ya = y_arrs[box_no];
                for (int n = 0; n < ncomp; ++n) {
                    cell_sum += xa(i,j,k,xcomp+n) * ya(i,j,k,ycomp+n);
                }
            }
            return cell_sum*weight;
        });
    } else
#endif
    {
#ifdef AMREX_USE_OMP
#pragma omp parallel if (!system::regtest_reduction) reduction(+:total)
#endif
        for (MFIter mfi(x,true); mfi.isValid(); ++mfi)
        {
            Box const& tile = mfi.growntilebox(nghost);
            auto const& ma = mask.const_array(mfi);
            auto const& xa = x.const_array(mfi);
            auto const& ya = y.const_array(mfi);
            AMREX_LOOP_4D(tile, ncomp, i, j, k, n,
            {
                auto weight = T(ma(i,j,k));
                total += weight * xa(i,j,k,xcomp+n) * ya(i,j,k,ycomp+n);
            });
        }
    }

    if (!local) {
        ParallelAllReduce::Sum(total, ParallelContext::CommunicatorSub());
    }

    return total;
}


/**
 * \brief Mask-weighted sum over cells and components of
 *        mask * x(…, xcomp+n)^2.
 *
 * The mask value of each cell is converted to the value type of FAB and used
 * as a multiplicative weight. Asserts that mask and x share BoxArray and
 * DistributionMapping and have at least nghost ghost cells.
 *
 * \param mask   FabArray of per-cell weights (first component is read)
 * \param x      FabArray
 * \param xcomp  first component in x
 * \param ncomp  number of components
 * \param nghost ghost-cell extent included in the sum
 * \param local  if false, the result is additionally sum-reduced over
 *               ParallelContext::CommunicatorSub()
 * \return the accumulated sum
 */
template <BaseFabType IFAB, BaseFabType FAB>
typename FAB::value_type
Dot (FabArray<IFAB> const& mask, FabArray<FAB> const& x, int xcomp, int ncomp,
     IntVect const& nghost, bool local = false)
{
    BL_ASSERT(x.boxArray() == mask.boxArray());
    BL_ASSERT(x.DistributionMap() == mask.DistributionMap());
    BL_ASSERT(x.nGrowVect().allGE(nghost) && mask.nGrowVect().allGE(nghost));

    BL_PROFILE("amrex::Dot()");

    using T = typename FAB::value_type;
    auto total = T(0.0);
#ifdef AMREX_USE_GPU
    if (Gpu::inLaunchRegion()) {
        auto const& m_arrs = mask.const_arrays();
        auto const& x_arrs = x.const_arrays();
        total = ParReduce(TypeList<ReduceOpSum>{}, TypeList<T>{}, x, nghost,
        [=] AMREX_GPU_DEVICE (int box_no, int i, int j, int k) noexcept -> GpuTuple<T>
        {
            auto cell_sum = T(0.0);
            auto weight = T(m_arrs[box_no](i,j,k));
            // Skip the component loop entirely for zero-weight cells.
            if (weight != 0) {
                auto const& xa = x_arrs[box_no];
                for (int n = 0; n < ncomp; ++n) {
                    auto val = xa(i,j,k,xcomp+n);
                    cell_sum += val*val;
                }
            }
            return cell_sum*weight;
        });
    } else
#endif
    {
#ifdef AMREX_USE_OMP
#pragma omp parallel if (!system::regtest_reduction) reduction(+:total)
#endif
        for (MFIter mfi(x,true); mfi.isValid(); ++mfi)
        {
            Box const& tile = mfi.growntilebox(nghost);
            auto const& ma = mask.const_array(mfi);
            auto const& xa = x.const_array(mfi);
            AMREX_LOOP_4D(tile, ncomp, i, j, k, n,
            {
                auto weight = T(ma(i,j,k));
                auto val = xa(i,j,k,xcomp+n);
                total += weight*val*val;
            });
        }
    }

    if (!local) {
        ParallelAllReduce::Sum(total, ParallelContext::CommunicatorSub());
    }

    return total;
}


/**
 * \brief Free-function form of MF::setVal.
 *
 * \param dst object whose setVal member is called
 * \param val value passed to dst.setVal
 */
template <MultiFabLike MF>
void
setVal (MF& dst, typename MF::value_type val)
{
    dst.setVal(val);
}


/**
 * \brief Free-function form of MF::setBndry.
 *
 * \param dst   object whose setBndry member is called
 * \param val   value passed to dst.setBndry
 * \param scomp first component
 * \param ncomp number of components
 */
template <MultiFabLike MF>
void
setBndry (MF& dst, typename MF::value_type val, int scomp, int ncomp)
{
    dst.setBndry(val, scomp, ncomp);
}


/**
 * \brief Scale dst by val; implemented with MF::mult.
 *
 * \param dst    object whose mult member is called
 * \param val    factor passed to dst.mult
 * \param scomp  first component
 * \param ncomp  number of components
 * \param nghost ghost-cell count passed to dst.mult
 */
template <MultiFabLike MF>
void
Scale (MF& dst, typename MF::value_type val, int scomp, int ncomp, int nghost)
{
    dst.mult(val, scomp, ncomp, nghost);
}


/**
 * \brief Copy components from src to dst through amrex::Copy.
 *
 * \param dst    destination
 * \param src    source
 * \param scomp  first component in src
 * \param dcomp  first component in dst
 * \param ncomp  number of components
 * \param nghost ghost-cell extent passed to amrex::Copy
 */
template <MultiFabLike DMF, MultiFabLike SMF>
void
LocalCopy (DMF& dst, SMF const& src, int scomp, int dcomp,
           int ncomp, IntVect const& nghost)
{
    amrex::Copy(dst, src, scomp, dcomp, ncomp, nghost);
}


/**
 * \brief Add components of src to dst through amrex::Add.
 *
 * \param dst    destination
 * \param src    source
 * \param scomp  first component in src
 * \param dcomp  first component in dst
 * \param ncomp  number of components
 * \param nghost ghost-cell extent passed to amrex::Add
 */
template <MultiFabLike MF>
void
LocalAdd (MF& dst, MF const& src, int scomp, int dcomp,
          int ncomp, IntVect const& nghost)
{
    amrex::Add(dst, src, scomp, dcomp, ncomp, nghost);
}


/**
 * \brief Free-function form of the static MF::Saxpy.
 *
 * All arguments are passed through unchanged.
 *
 * \param dst    destination
 * \param a      scalar coefficient
 * \param src    source
 * \param scomp  first component in src
 * \param dcomp  first component in dst
 * \param ncomp  number of components
 * \param nghost ghost-cell extent
 */
template <MultiFabLike MF>
void
Saxpy (MF& dst, typename MF::value_type a, MF const& src, int scomp, int dcomp,
       int ncomp, IntVect const& nghost)
{
    MF::Saxpy(dst, a, src, scomp, dcomp, ncomp, nghost);
}


/**
 * \brief Free-function form of the static MF::Xpay.
 *
 * All arguments are passed through unchanged.
 *
 * \param dst    destination
 * \param a      scalar coefficient
 * \param src    source
 * \param scomp  first component in src
 * \param dcomp  first component in dst
 * \param ncomp  number of components
 * \param nghost ghost-cell extent
 */
template <MultiFabLike MF>
void
Xpay (MF& dst, typename MF::value_type a, MF const& src, int scomp, int dcomp,
      int ncomp, IntVect const& nghost)
{
    MF::Xpay(dst, a, src, scomp, dcomp, ncomp, nghost);
}


/**
 * \brief Free-function form of the static MF::Saxpy_Xpay.
 *
 * All arguments are passed through unchanged.
 *
 * \param dst       destination
 * \param a_saxpy   scalar coefficient of the Saxpy part
 * \param src_saxpy source of the Saxpy part
 * \param a_xpay    scalar coefficient of the Xpay part
 * \param src_xpay  source of the Xpay part
 * \param scomp     first source component
 * \param dcomp     first destination component
 * \param ncomp     number of components
 * \param nghost    ghost-cell extent
 */
template <MultiFabLike MF>
void
Saxpy_Xpay (MF& dst, typename MF::value_type a_saxpy, MF const& src_saxpy,
            typename MF::value_type a_xpay, MF const& src_xpay, int scomp, int dcomp,
            int ncomp, IntVect const& nghost)
{
    MF::Saxpy_Xpay(dst, a_saxpy, src_saxpy, a_xpay, src_xpay,
                   scomp, dcomp, ncomp, nghost);
}


/**
 * \brief Free-function form of the static MF::Saxpy_Saxpy.
 *
 * All arguments are passed through unchanged.
 *
 * \param dst1   first destination
 * \param a1     scalar coefficient for the first update
 * \param src1   source for the first update
 * \param dst2   second destination
 * \param a2     scalar coefficient for the second update
 * \param src2   source for the second update
 * \param scomp  first source component
 * \param dcomp  first destination component
 * \param ncomp  number of components
 * \param nghost ghost-cell extent
 */
template <MultiFabLike MF>
void
Saxpy_Saxpy (MF& dst1, typename MF::value_type a1, MF const& src1,
             MF& dst2, typename MF::value_type a2, MF const& src2, int scomp, int dcomp,
             int ncomp, IntVect const& nghost)
{
    MF::Saxpy_Saxpy(dst1, a1, src1,
                    dst2, a2, src2,
                    scomp, dcomp, ncomp, nghost);
}


/**
 * \brief Free-function form of the static MF::Saypy_Saxpy.
 *
 * All arguments are passed through unchanged.
 *
 * \param dst1   first destination
 * \param a1     scalar coefficient for the first update
 * \param dst2   second destination
 * \param a2     scalar coefficient for the second update
 * \param src    source
 * \param scomp  first source component
 * \param dcomp  first destination component
 * \param ncomp  number of components
 * \param nghost ghost-cell extent
 */
template <MultiFabLike MF>
void
Saypy_Saxpy (MF& dst1, typename MF::value_type a1,
             MF& dst2, typename MF::value_type a2, MF const& src, int scomp, int dcomp,
             int ncomp, IntVect const& nghost)
{
    MF::Saypy_Saxpy(dst1, a1,
                    dst2, a2, src,
                    scomp, dcomp, ncomp, nghost);
}


/**
 * \brief Free-function form of the static MF::LinComb.
 *
 * All arguments are passed through unchanged.
 *
 * \param dst    destination
 * \param a      scalar coefficient of src_a
 * \param src_a  first source
 * \param acomp  first component in src_a
 * \param b      scalar coefficient of src_b
 * \param src_b  second source
 * \param bcomp  first component in src_b
 * \param dcomp  first component in dst
 * \param ncomp  number of components
 * \param nghost ghost-cell extent
 */
template <MultiFabLike MF>
void
LinComb (MF& dst,
         typename MF::value_type a, MF const& src_a, int acomp,
         typename MF::value_type b, MF const& src_b, int bcomp,
         int dcomp, int ncomp, IntVect const& nghost)
{
    MF::LinComb(dst,
                a, src_a, acomp,
                b, src_b, bcomp,
                dcomp, ncomp, nghost);
}


/**
 * \brief Free-function form of MF::ParallelCopy.
 *
 * \param dst    destination; its ParallelCopy member is called
 * \param src    source
 * \param scomp  first component in src
 * \param dcomp  first component in dst
 * \param ncomp  number of components
 * \param ng_src source ghost extent (defaults to IntVect(0))
 * \param ng_dst destination ghost extent (defaults to IntVect(0))
 * \param period periodicity (defaults to Periodicity::NonPeriodic())
 */
template <MultiFabLike MF>
void
ParallelCopy (MF& dst, MF const& src, int scomp, int dcomp, int ncomp,
              IntVect const& ng_src = IntVect(0),
              IntVect const& ng_dst = IntVect(0),
              Periodicity const& period = Periodicity::NonPeriodic())
{
    dst.ParallelCopy(src, scomp, dcomp, ncomp,
                     ng_src, ng_dst, period);
}


/**
 * \brief Free-function form of MF::norminf.
 *
 * \param mf     object whose norminf member is called
 * \param scomp  first component
 * \param ncomp  number of components
 * \param nghost ghost-cell extent
 * \param local  passed through to mf.norminf
 * \return the value returned by mf.norminf
 */
template <MultiFabLike MF>
[[nodiscard]] typename MF::value_type
norminf (MF const& mf, int scomp, int ncomp, IntVect const& nghost,
         bool local = false)
{
    auto const result = mf.norminf(scomp, ncomp, nghost, local);
    return result;
}


/**
 * \brief Call setVal(val) on every element of an Array of MFs.
 *
 * \param dst array whose elements are modified
 * \param val value passed to each element's setVal
 */
template <MultiFabLike MF, std::size_t N>
void
setVal (Array<MF,N>& dst, typename MF::value_type val)
{
    for (std::size_t idx = 0; idx < N; ++idx) {
        dst[idx].setVal(val);
    }
}


/**
 * \brief Call setBndry(val, scomp, ncomp) on every element of an Array of MFs.
 *
 * \param dst   array whose elements are modified
 * \param val   value passed to each element's setBndry
 * \param scomp first component
 * \param ncomp number of components
 */
template <MultiFabLike MF, std::size_t N>
void
setBndry (Array<MF,N>& dst, typename MF::value_type val, int scomp, int ncomp)
{
    for (std::size_t idx = 0; idx < N; ++idx) {
        dst[idx].setBndry(val, scomp, ncomp);
    }
}


/**
 * \brief Call mult(val, scomp, ncomp, nghost) on every element of an Array
 *        of MFs.
 *
 * \param dst    array whose elements are modified
 * \param val    factor passed to each element's mult
 * \param scomp  first component
 * \param ncomp  number of components
 * \param nghost ghost-cell count passed to mult
 */
template <MultiFabLike MF, std::size_t N>
void
Scale (Array<MF,N>& dst, typename MF::value_type val, int scomp, int ncomp,
       int nghost)
{
    for (std::size_t idx = 0; idx < N; ++idx) {
        dst[idx].mult(val, scomp, ncomp, nghost);
    }
}


/**
 * \brief Element-wise amrex::Copy from src[i] to dst[i] for i in [0, N).
 *
 * \param dst    array of destinations
 * \param src    array of sources
 * \param scomp  first component in each source
 * \param dcomp  first component in each destination
 * \param ncomp  number of components
 * \param nghost ghost-cell extent passed to amrex::Copy
 */
template <MultiFabLike DMF, MultiFabLike SMF, std::size_t N>
void
LocalCopy (Array<DMF,N>& dst, Array<SMF,N> const& src, int scomp, int dcomp,
           int ncomp, IntVect const& nghost)
{
    for (std::size_t idx = 0; idx < N; ++idx) {
        auto&       to   = dst[idx];
        auto const& from = src[idx];
        amrex::Copy(to, from, scomp, dcomp, ncomp, nghost);
    }
}


/**
 * \brief Element-wise amrex::Add of src[i] onto dst[i] for i in [0, N).
 *
 * \param dst    array of destinations
 * \param src    array of sources
 * \param scomp  first component in each source
 * \param dcomp  first component in each destination
 * \param ncomp  number of components
 * \param nghost ghost-cell extent passed to amrex::Add
 */
template <MultiFabLike MF, std::size_t N>
void
LocalAdd (Array<MF,N>& dst, Array<MF,N> const& src, int scomp, int dcomp,
          int ncomp, IntVect const& nghost)
{
    for (std::size_t idx = 0; idx < N; ++idx) {
        auto&       to   = dst[idx];
        auto const& from = src[idx];
        amrex::Add(to, from, scomp, dcomp, ncomp, nghost);
    }
}


/**
 * \brief Element-wise MF::Saxpy on dst[i] and src[i] for i in [0, N).
 *
 * \param dst    array of destinations
 * \param a      scalar coefficient, the same for every element
 * \param src    array of sources
 * \param scomp  first component in each source
 * \param dcomp  first component in each destination
 * \param ncomp  number of components
 * \param nghost ghost-cell extent
 */
template <MultiFabLike MF, std::size_t N>
void
Saxpy (Array<MF,N>& dst, typename MF::value_type a,
       Array<MF,N> const& src, int scomp, int dcomp, int ncomp,
       IntVect const& nghost)
{
    for (std::size_t idx = 0; idx < N; ++idx) {
        auto&       to   = dst[idx];
        auto const& from = src[idx];
        MF::Saxpy(to, a, from, scomp, dcomp, ncomp, nghost);
    }
}


/**
 * \brief Element-wise MF::Xpay on dst[i] and src[i] for i in [0, N).
 *
 * \param dst    array of destinations
 * \param a      scalar coefficient, the same for every element
 * \param src    array of sources
 * \param scomp  first component in each source
 * \param dcomp  first component in each destination
 * \param ncomp  number of components
 * \param nghost ghost-cell extent
 */
template <MultiFabLike MF, std::size_t N>
void
Xpay (Array<MF,N>& dst, typename MF::value_type a,
      Array<MF,N> const& src, int scomp, int dcomp, int ncomp,
      IntVect const& nghost)
{
    for (std::size_t idx = 0; idx < N; ++idx) {
        auto&       to   = dst[idx];
        auto const& from = src[idx];
        MF::Xpay(to, a, from, scomp, dcomp, ncomp, nghost);
    }
}


/**
 * \brief Element-wise MF::LinComb on dst[i], src_a[i] and src_b[i] for
 *        i in [0, N).
 *
 * \param dst    array of destinations
 * \param a      scalar coefficient of src_a
 * \param src_a  array of first sources
 * \param acomp  first component in each src_a element
 * \param b      scalar coefficient of src_b
 * \param src_b  array of second sources
 * \param bcomp  first component in each src_b element
 * \param dcomp  first component in each destination
 * \param ncomp  number of components
 * \param nghost ghost-cell extent
 */
template <MultiFabLike MF, std::size_t N>
void
LinComb (Array<MF,N>& dst,
         typename MF::value_type a, Array<MF,N> const& src_a, int acomp,
         typename MF::value_type b, Array<MF,N> const& src_b, int bcomp,
         int dcomp, int ncomp, IntVect const& nghost)
{
    for (std::size_t idx = 0; idx < N; ++idx) {
        auto&       to     = dst[idx];
        auto const& from_a = src_a[idx];
        auto const& from_b = src_b[idx];
        MF::LinComb(to, a, from_a, acomp, b, from_b, bcomp, dcomp, ncomp, nghost);
    }
}


/**
 * \brief Call dst[i].ParallelCopy(src[i], ...) for every element pair of two
 *        arrays of MultiFab-like objects.
 *
 * \param dst    destination array
 * \param src    source array (same length as dst)
 * \param scomp  starting source component
 * \param dcomp  starting destination component
 * \param ncomp  number of components
 * \param ng_src source ghost cells passed on to ParallelCopy (default 0)
 * \param ng_dst destination ghost cells passed on to ParallelCopy (default 0)
 * \param period periodicity passed on to ParallelCopy (default non-periodic)
 */
template <MultiFabLike MF, std::size_t N>
void ParallelCopy (Array<MF,N>& dst, Array<MF,N> const& src,
                   int scomp, int dcomp, int ncomp,
                   IntVect const& ng_src = IntVect(0),
                   IntVect const& ng_dst = IntVect(0),
                   Periodicity const& period = Periodicity::NonPeriodic())
{
    // Walk the source array in lock-step with the destination array.
    auto from = src.begin();
    for (auto& to : dst) {
        to.ParallelCopy(*from, scomp, dcomp, ncomp, ng_src, ng_dst, period);
        ++from;
    }
}


/**
 * \brief Maximum of the norminf values of all elements in an array of
 *        MultiFab-like objects.
 *
 * Each element is queried with its local flag set to true, so at most one
 * ParallelAllReduce::Max is performed, on the combined result.
 *
 * \param mf     array of objects to examine
 * \param scomp  starting component
 * \param ncomp  number of components
 * \param nghost ghost cells passed on to each element's norminf
 * \param local  if true, skip the reduction over
 *               ParallelContext::CommunicatorSub()
 *
 * \return the largest per-element value, starting from 0
 */
template <MultiFabLike MF, std::size_t N>
[[nodiscard]] typename MF::value_type
norminf (Array<MF,N> const& mf, int scomp, int ncomp, IntVect const& nghost,
         bool local = false)
{
    using value_type = typename MF::value_type;

    value_type result = value_type(0);
    for (auto const& element : mf) {
        auto const element_norm = element.norminf(scomp, ncomp, nghost, true);
        result = std::max(result, element_norm);
    }

    if (local) {
        return result;
    }

    ParallelAllReduce::Max(result, ParallelContext::CommunicatorSub());
    return result;
}


/**
 * \brief Number of components reported by the first element of the array.
 *
 * Only element 0 is consulted; the other elements are not checked.
 */
template <MultiFabLike MF, std::size_t N>
requires (N > 0)
[[nodiscard]] int nComp (Array<MF,N> const& mf)
{
    auto const& first = mf.front();
    return first.nComp();
}


/**
 * \brief Ghost-cell vector reported by the first element of the array.
 *
 * Only element 0 is consulted; the other elements are not checked.
 */
template <MultiFabLike MF, std::size_t N>
requires (N > 0)
[[nodiscard]] IntVect nGrowVect (Array<MF,N> const& mf)
{
    auto const& first = mf.front();
    return first.nGrowVect();
}


/**
 * \brief BoxArray reported by the first element of the array.
 *
 * Only element 0 is consulted; the other elements are not checked.
 */
template <MultiFabLike MF, std::size_t N>
requires (N > 0)
[[nodiscard]] BoxArray const&
boxArray (Array<MF,N> const& mf)
{
    auto const& first = mf.front();
    return first.boxArray();
}


/**
 * \brief DistributionMapping reported by the first element of the array.
 *
 * Only element 0 is consulted; the other elements are not checked.
 */
template <MultiFabLike MF, std::size_t N>
requires (N > 0)
[[nodiscard]] DistributionMapping const&
DistributionMap (Array<MF,N> const& mf)
{
    auto const& first = mf.front();
    return first.DistributionMap();
}


/**
 * \brief Return a mask indicating how many duplicates are in each point
 *
 * The mask is built on fa's BoxArray and DistributionMapping with one
 * component and nghost ghost cells. Every point starts at 1 and is
 * incremented by one for each box intersection (over all periodic shifts)
 * that covers it, except the fab's own unshifted box.
 *
 * \param fa     input FabArray
 * \param nghost number of ghost cells included in counting
 * \param period periodicity
 *
 * \return integer FabArray holding the per-point count
 */

template <class FAB>

FabArray<BaseFab<int>>


OverlapMask (FabArray<FAB> const& fa, IntVect const& nghost, Periodicity const& period)

{

    BL_PROFILE("OverlapMask()");


    const BoxArray& ba = fa.boxArray();

    const DistributionMapping& dm = fa.DistributionMap();


    FabArray<BaseFab<int>> mask(ba, dm, 1, nghost);

    // Every point counts itself once.
    mask.setVal(1);


    // Shift vectors supplied by the periodicity object.
    const std::vector<IntVect>& pshifts = period.shiftIntVect();


    // Work items collected for the single tagged GPU launch after the loop.
    Vector<Array4BoxTag<int> > tags;


    bool run_on_gpu = Gpu::inLaunchRegion();

    // Marks both as intentionally unused for builds where the OMP/GPU
    // sections below are compiled out.
    amrex::ignore_unused(run_on_gpu, tags);

    // The `if` clause keeps the region on one thread when running on GPU,
    // which is the only case in which the shared `tags` vector is appended to.
#ifdef AMREX_USE_OMP

#pragma omp parallel if (!run_on_gpu)

#endif

    {

        // Declared inside the (possibly parallel) block, so each thread has
        // its own scratch buffer for intersection results.
        std::vector< std::pair<int,Box> > isects;


        for (MFIter mfi(mask); mfi.isValid(); ++mfi)

        {

            // Box of the mask fab itself.
            // NOTE(review): presumably includes the nghost ghost cells — confirm.
            const Box& bx = mask[mfi].box();

            auto const& arr = mask.array(mfi);


            for (const auto& iv : pshifts)

            {

                // Collect overlaps between the shifted fab box and ba.
                // NOTE(review): the trailing (false, nghost) arguments presumably
                // mean "all intersections, with ba's boxes grown by nghost" —
                // confirm against BoxArray::intersections.
                ba.intersections(bx+iv, isects, false, nghost);

                for (const auto& is : isects)

                {

                    // Undo the shift so the overlap is in this fab's index space.
                    Box const& b = is.second-iv;

                    // An unshifted overlap equal to the whole fab box is treated
                    // as the fab itself; it is already counted by setVal(1).
                    if (iv == 0 && b == bx) { continue; }

#ifdef AMREX_USE_GPU

                    if (run_on_gpu) {

                        // Defer the increment to the tagged launch below.
                        tags.push_back(Array4BoxTag<int>{.dfab = arr, .dbox = b});

                    } else

#endif

                    {

                        // CPU path: increment the count over the overlap directly.
                        amrex::LoopConcurrentOnCpu(b, [=] (int i, int j, int k) noexcept

                        {

                            arr(i,j,k) += 1;

                        });

                    }

                }

            }

        }

    }


    // One launch over all collected tags, one component each; increments use
    // an atomic add.
    // NOTE(review): presumably atomic because tagged boxes on the same fab can
    // overlap each other — confirm.
#ifdef AMREX_USE_GPU

    amrex::ParallelFor(tags, 1,

    [=] AMREX_GPU_DEVICE (int i, int j, int k, int n, Array4BoxTag<int> const& tag) noexcept

    {

        Gpu::Atomic::AddNoRet(tag.dfab.ptr(i,j,k,n), 1);

    });

#endif


    return mask;

}


}


#endif

BL_PROFILE
#define BL_PROFILE(a)
Definition AMReX_BLProfiler.H:551

BL_ASSERT
#define BL_ASSERT(EX)
Definition AMReX_BLassert.H:39

AMREX_ASSERT_WITH_MESSAGE
#define AMREX_ASSERT_WITH_MESSAGE(EX, MSG)
Definition AMReX_BLassert.H:37

AMREX_ASSERT
#define AMREX_ASSERT(EX)
Definition AMReX_BLassert.H:38

AMReX_Concepts.H

AMReX_FabArray.H

AMREX_HOST_DEVICE_PARALLEL_FOR_4D
#define AMREX_HOST_DEVICE_PARALLEL_FOR_4D(...)
Definition AMReX_GpuLaunchMacrosC.nolint.H:111

AMREX_GPU_DEVICE
#define AMREX_GPU_DEVICE
Definition AMReX_GpuQualifiers.H:18

AMREX_GPU_HOST_DEVICE
#define AMREX_GPU_HOST_DEVICE
Definition AMReX_GpuQualifiers.H:20

pdst
Real * pdst
Definition AMReX_HypreMLABecLap.cpp:1130

mask
Array4< int const  > mask
Definition AMReX_InterpFaceRegister.cpp:93

AMReX_LayoutData.H

AMREX_LOOP_3D
#define AMREX_LOOP_3D(bx, i, j, k, block)
Definition AMReX_Loop.nolint.H:4

AMREX_LOOP_4D
#define AMREX_LOOP_4D(bx, ncomp, i, j, k, n, block)
Definition AMReX_Loop.nolint.H:16

AMReX_ParReduce.H

AMReX_Print.H

AMREX_D_TERM
#define AMREX_D_TERM(a, b, c)
Definition AMReX_SPACE.H:172

AMREX_D_DECL
#define AMREX_D_DECL(a, b, c)
Definition AMReX_SPACE.H:171

amrex::AllPrint
Print on all processors of the default communicator.
Definition AMReX_Print.H:113

amrex::Arena::isManaged
virtual bool isManaged() const
Check whether it is managed GPU memory.
Definition AMReX_Arena.cpp:88

amrex::Arena::isDevice
virtual bool isDevice() const
Check whether it is non-managed GPU device memory.
Definition AMReX_Arena.cpp:100

amrex::BoxArray
Reference-counted collection of Boxes.
Definition AMReX_BoxArray.H:676

amrex::BoxArray::intersections
std::vector< std::pair< int, Box > > intersections(const Box &bx) const
Return all intersections of bx with this BoxArray.
Definition AMReX_BoxArray.cpp:1186

amrex::BoxND< 3 >

amrex::BoxND::contains
__host__ __device__ bool contains(const IntVectND< dim > &p) const noexcept
Return true if argument is contained within BoxND.
Definition AMReX_Box.H:233

amrex::BoxND::ok
__host__ __device__ bool ok() const noexcept
Return true if high bounds are >= low bounds and the index type is valid.
Definition AMReX_Box.H:229

amrex::DistributionMapping
Calculates the distribution of FABs to MPI processes.
Definition AMReX_DistributionMapping.H:51

amrex::FabArrayBase::nGrowVect
IntVect nGrowVect() const noexcept
Definition AMReX_FabArrayBase.H:80

amrex::FabArrayBase::isFusingCandidate
bool isFusingCandidate() const noexcept
Is this a good candidate for kernel fusing?
Definition AMReX_FabArrayBase.cpp:2705

amrex::FabArrayBase::ixType
IndexType ixType() const noexcept
Return index type.
Definition AMReX_FabArrayBase.H:86

amrex::FabArrayBase::DistributionMap
const DistributionMapping & DistributionMap() const noexcept
Return constant reference to associated DistributionMapping.
Definition AMReX_FabArrayBase.H:130

amrex::FabArrayBase::ADD
@ ADD
Definition AMReX_FabArrayBase.H:393

amrex::FabArrayBase::nComp
int nComp() const noexcept
Return number of variables (aka components) associated with each point.
Definition AMReX_FabArrayBase.H:83

amrex::FabArrayBase::boxArray
const BoxArray & boxArray() const noexcept
Return a constant reference to the BoxArray that defines the valid region associated with this FabArr...
Definition AMReX_FabArrayBase.H:95

amrex::FabArray
An Array of FortranArrayBox(FAB)-like Objects.
Definition AMReX_FabArray.H:344

amrex::FabArray::mult
void mult(value_type val, int comp, int num_comp, int nghost=0)
Definition AMReX_FabArray.H:2968

amrex::FabArray::setBndry
void setBndry(value_type val)
Set all values in the boundary region to val.
Definition AMReX_FabArray.H:2487

amrex::FabArray::os_temp
std::unique_ptr< FabArray< FAB > > os_temp
Definition AMReX_FabArray.H:1661

amrex::FabArray::Factory
const FabFactory< FAB > & Factory() const noexcept
Definition AMReX_FabArray.H:442

amrex::FabArray::prefetchToHost
void prefetchToHost(const MFIter &mfi) const noexcept
Definition AMReX_FabArray.H:541

amrex::FabArray::arrays
MultiArray4< typename FabArray< FAB >::value_type > arrays() noexcept
Definition AMReX_FabArray.H:633

amrex::FabArray::prefetchToDevice
void prefetchToDevice(const MFIter &mfi) const noexcept
Definition AMReX_FabArray.H:551

amrex::FabArray::arena
Arena * arena() const noexcept
Definition AMReX_FabArray.H:445

amrex::FabArray::const_arrays
MultiArray4< typename FabArray< FAB >::value_type const > const_arrays() const noexcept
Definition AMReX_FabArray.H:647

amrex::FabArray::setVal
void setVal(value_type val)
Set all components in the entire region of each FAB to val.
Definition AMReX_FabArray.H:2705

amrex::FabArray::array
Array4< typename FabArray< FAB >::value_type const > array(const MFIter &mfi) const noexcept
Definition AMReX_FabArray.H:561

amrex::FabArray::hasEBFabFactory
bool hasEBFabFactory() const noexcept
Definition AMReX_FabArray.H:449

amrex::FabArray::const_array
Array4< typename FabArray< FAB >::value_type const > const_array(const MFIter &mfi) const noexcept
Definition AMReX_FabArray.H:585

amrex::GpuTuple
GPU-compatible tuple.
Definition AMReX_Tuple.H:98

amrex::Gpu::Buffer
Definition AMReX_GpuBuffer.H:24

amrex::Gpu::Buffer::data
T const * data() const noexcept
Definition AMReX_GpuBuffer.H:51

amrex::IndexTypeND::cellCentered
__host__ __device__ bool cellCentered() const noexcept
True if the IndexTypeND is CELL based in all directions.
Definition AMReX_IndexType.H:102

amrex::IntVectND< 3 >

amrex::IntVectND::allGT
__host__ __device__ constexpr bool allGT(const IntVectND< dim > &rhs) const noexcept
Returns true if this is greater than argument for all components. NOTE: This is NOT a strict weak ord...
Definition AMReX_IntVect.H:517

amrex::IntVectND< 3 >::TheZeroVector
__host__ static __device__ constexpr IntVectND< dim > TheZeroVector() noexcept
This static member function returns a reference to a constant IntVectND object, all of whose dim argu...
Definition AMReX_IntVect.H:771

amrex::IntVectND< 3 >::TheMinVector
__host__ static __device__ constexpr IntVectND< dim > TheMinVector() noexcept
Definition AMReX_IntVect.H:819

amrex::MFIter
Iterator for looping over tiles and boxes of amrex::FabArray based containers.
Definition AMReX_MFIter.H:88

amrex::MFIter::isValid
bool isValid() const noexcept
Is the iterator valid i.e. is it associated with a FAB?
Definition AMReX_MFIter.H:172

amrex::PODVector
Dynamically allocated vector for trivially copyable data.
Definition AMReX_PODVector.H:308

amrex::PODVector::data
T * data() noexcept
Definition AMReX_PODVector.H:666

amrex::Periodicity
This provides length of period for periodic domains. 0 means it is not periodic in that direction....
Definition AMReX_Periodicity.H:17

amrex::Periodicity::NonPeriodic
static const Periodicity & NonPeriodic() noexcept
Definition AMReX_Periodicity.cpp:52

amrex::Periodicity::shiftIntVect
std::vector< IntVect > shiftIntVect(IntVect const &nghost=IntVect(0)) const
Definition AMReX_Periodicity.cpp:8

amrex::Print::SetPrecision
Print & SetPrecision(int p)
Definition AMReX_Print.H:86

amrex::Vector
This class is a thin wrapper around std::vector. Unlike vector, Vector::operator[] provides bound che...
Definition AMReX_Vector.H:29

amrex::makeSingleCellBox
__host__ __device__ BoxND< dim > makeSingleCellBox(int i, int j, int k, IndexTypeND< dim > typ=IndexTypeND< dim >::TheCellType())
Create a single-cell box at coordinates (i,j,k).
Definition AMReX_Box.H:2458

amrex::grow
__host__ __device__ BoxND< dim > grow(const BoxND< dim > &b, int i) noexcept
Return a copy of b grown uniformly by i cells in every direction.
Definition AMReX_Box.H:1326

amrex::Array
std::array< T, N > Array
Definition AMReX_Array.H:31

amrex::ParallelAllReduce::Sum
void Sum(Gpu::DeviceVector< T > &v, MPI_Comm comm)
Definition AMReX_GpuParallelReduce.H:34

amrex::ParallelAllReduce::Max
void Max(KeyValuePair< K, V > &vi, MPI_Comm comm)
Definition AMReX_ParallelReduce.H:133

amrex::Swap
__host__ __device__ void Swap(T &t1, T &t2) noexcept
Definition AMReX_Algorithm.H:108

amrex::Gpu::Atomic::Exch
__host__ __device__ AMREX_FORCE_INLINE T Exch(T *address, T val) noexcept
Definition AMReX_GpuAtomic.H:487

amrex::Gpu::Atomic::AddNoRet
__host__ __device__ AMREX_FORCE_INLINE void AddNoRet(T *sum, T value) noexcept
Definition AMReX_GpuAtomic.H:283

amrex::Gpu::streamSynchronize
void streamSynchronize() noexcept
Definition AMReX_GpuDevice.H:310

amrex::Gpu::dtoh_memcpy_async
void dtoh_memcpy_async(void *p_h, const void *p_d, const std::size_t sz) noexcept
Definition AMReX_GpuDevice.H:435

amrex::Gpu::inLaunchRegion
bool inLaunchRegion() noexcept
Definition AMReX_GpuControl.H:88

amrex::Gpu::inNoSyncRegion
bool inNoSyncRegion() noexcept
Definition AMReX_GpuControl.H:148

amrex::Gpu::htod_memcpy_async
void htod_memcpy_async(void *p_d, const void *p_h, const std::size_t sz) noexcept
Definition AMReX_GpuDevice.H:421

amrex::ParallelContext::CommunicatorSub
MPI_Comm CommunicatorSub() noexcept
sub-communicator for current frame
Definition AMReX_ParallelContext.H:70

amrex
Definition AMReX_Amr.cpp:50

amrex::ignore_unused
__host__ __device__ void ignore_unused(const Ts &...)
No-op helper that marks variables as intentionally unused.
Definition AMReX.H:259

amrex::nComp
int nComp(FabArrayBase const &fa)
Definition AMReX_FabArrayBase.cpp:2852

amrex::Copy
void Copy(FabArray< DFAB > &dst, FabArray< SFAB > const &src, int srccomp, int dstcomp, int numcomp, int nghost)
Definition AMReX_FabArray.H:180

amrex::htod_memcpy
void htod_memcpy(FabArray< FAB > &dst, FabArray< FAB > const &src, int scomp, int dcomp, int ncomp)
Definition AMReX_FabArrayUtility.H:1476

amrex::OverrideSync_nowait
void OverrideSync_nowait(FabArray< FAB > &fa, FabArray< IFAB > const &msk, const Periodicity &period)
Definition AMReX_FabArrayUtility.H:1390

amrex::Add
void Add(FabArray< FAB > &dst, FabArray< FAB > const &src, int srccomp, int dstcomp, int numcomp, int nghost)
Definition AMReX_FabArray.H:239

amrex::Order::F
@ F

amrex::ParReduce
ReduceData< Ts... >::Type ParReduce(TypeList< Ops... > operation_list, TypeList< Ts... > type_list, FabArray< FAB > const &fa, IntVect const &nghost, F &&f)
Parallel reduce for MultiFab/FabArray. The reduce result is local and it's the user's responsibility ...
Definition AMReX_ParReduce.H:48

amrex::DistributionMap
DistributionMapping const & DistributionMap(FabArrayBase const &fa)
Definition AMReX_FabArrayBase.cpp:2867

amrex::nGrowVect
IntVect nGrowVect(FabArrayBase const &fa)
Definition AMReX_FabArrayBase.cpp:2857

amrex::Scale
void Scale(MF &dst, typename MF::value_type val, int scomp, int ncomp, int nghost)
dst *= val
Definition AMReX_FabArrayUtility.H:1875

amrex::Dot
FAB::value_type Dot(FabArray< FAB > const &x, int xcomp, FabArray< FAB > const &y, int ycomp, int ncomp, IntVect const &nghost, bool local=false)
Compute dot products of two FabArrays.
Definition AMReX_FabArrayUtility.H:1609

amrex::Saxpy_Xpay
void Saxpy_Xpay(MF &dst, typename MF::value_type a_saxpy, MF const &src_saxpy, typename MF::value_type a_xpay, MF const &src_xpay, int scomp, int dcomp, int ncomp, IntVect const &nghost)
dst += a_saxpy * src_saxpy followed by dst = src_xpay + a_xpay * dst
Definition AMReX_FabArrayUtility.H:1914

amrex::prefetchToDevice
void prefetchToDevice(FabArray< FAB > const &fa, const bool synchronous=true)
Definition AMReX_FabArrayUtility.H:1363

amrex::ReduceMin
FAB::value_type ReduceMin(FabArray< FAB > const &fa, int nghost, F &&f)
Definition AMReX_FabArrayUtility.H:304

amrex::ParallelFor
void ParallelFor(TypeList< CTOs... > ctos, std::array< int, sizeof...(CTOs)> const &runtime_options, T N, F &&f)
Definition AMReX_CTOParallelForImpl.H:202

amrex::OverlapMask
FabArray< BaseFab< int > > OverlapMask(FabArray< FAB > const &fa, IntVect const &nghost, Periodicity const &period)
Definition AMReX_FabArrayUtility.H:2117

amrex::prefetchToHost
void prefetchToHost(FabArray< FAB > const &fa, const bool synchronous=true)
Definition AMReX_FabArrayUtility.H:1348

amrex::isMFIterSafe
bool isMFIterSafe(const FabArrayBase &x, const FabArrayBase &y)
Definition AMReX_MFIter.H:252

amrex::Saxpy_Saxpy
void Saxpy_Saxpy(MF &dst1, typename MF::value_type a1, MF const &src1, MF &dst2, typename MF::value_type a2, MF const &src2, int scomp, int dcomp, int ncomp, IntVect const &nghost)
dst1 += a1 * src1 followed by dst2 += a2 * src2
Definition AMReX_FabArrayUtility.H:1923

amrex::indexFromValue
IntVect indexFromValue(FabArray< FAB > const &mf, int comp, IntVect const &nghost, typename FAB::value_type value)
Definition AMReX_FabArrayUtility.H:1501

amrex::LinComb
void LinComb(MF &dst, typename MF::value_type a, MF const &src_a, int acomp, typename MF::value_type b, MF const &src_b, int bcomp, int dcomp, int ncomp, IntVect const &nghost)
dst = a*src_a + b*src_b
Definition AMReX_FabArrayUtility.H:1941

amrex::ParallelCopy
void ParallelCopy(MF &dst, MF const &src, int scomp, int dcomp, int ncomp, IntVect const &ng_src=IntVect(0), IntVect const &ng_dst=IntVect(0), Periodicity const &period=Periodicity::NonPeriodic())
dst = src w/ MPI communication
Definition AMReX_FabArrayUtility.H:1951

amrex::Saypy_Saxpy
void Saypy_Saxpy(MF &dst1, typename MF::value_type a1, MF &dst2, typename MF::value_type a2, MF const &src, int scomp, int dcomp, int ncomp, IntVect const &nghost)
dst1 += a1 * dst2 followed by dst2 += a2 * src
Definition AMReX_FabArrayUtility.H:1932

amrex::Multiply
void Multiply(FabArray< FAB > &dst, FabArray< FAB > const &src, int srccomp, int dstcomp, int numcomp, int nghost)
Definition AMReX_FabArrayUtility.H:1214

amrex::Direction::y
@ y

amrex::Direction::x
@ x

amrex::IntVect
IntVectND< 3 > IntVect
IntVect is an alias for amrex::IntVectND instantiated with AMREX_SPACEDIM.
Definition AMReX_BaseFwd.H:38

amrex::Abs
void Abs(FabArray< FAB > &fa, int icomp, int numcomp, int nghost)
Definition AMReX_FabArrayUtility.H:1305

amrex::OverrideSync_finish
void OverrideSync_finish(FabArray< FAB > &fa)
Definition AMReX_FabArrayUtility.H:1437

amrex::single_task
void single_task(L &&f) noexcept
Definition AMReX_GpuLaunchFunctsC.H:1239

amrex::dtoh_memcpy
void dtoh_memcpy(FabArray< FAB > &dst, FabArray< FAB > const &src, int scomp, int dcomp, int ncomp)
Definition AMReX_FabArrayUtility.H:1451

amrex::LocalCopy
void LocalCopy(DMF &dst, SMF const &src, int scomp, int dcomp, int ncomp, IntVect const &nghost)
dst = src
Definition AMReX_FabArrayUtility.H:1882

amrex::TilingIfNotGPU
bool TilingIfNotGPU() noexcept
Definition AMReX_MFIter.H:12

amrex::setBndry
void setBndry(MF &dst, typename MF::value_type val, int scomp, int ncomp)
dst = val in ghost cells.
Definition AMReX_FabArrayUtility.H:1868

amrex::printCell
void printCell(FabArray< FAB > const &mf, const IntVect &cell, int comp=-1, const IntVect &ng=IntVect::TheZeroVector())
Definition AMReX_FabArrayUtility.H:1051

amrex::norminf
MF::value_type norminf(MF const &mf, int scomp, int ncomp, IntVect const &nghost, bool local=false)
Definition AMReX_FabArrayUtility.H:1961

amrex::ReduceLogicalOr
bool ReduceLogicalOr(FabArray< FAB > const &fa, int nghost, F &&f)
Definition AMReX_FabArrayUtility.H:904

amrex::LoopConcurrentOnCpu
void LoopConcurrentOnCpu(Dim3 lo, Dim3 hi, F const &f) noexcept
Definition AMReX_Loop.H:388

amrex::Xpay
void Xpay(MF &dst, typename MF::value_type a, MF const &src, int scomp, int dcomp, int ncomp, IntVect const &nghost)
dst = src + a * dst
Definition AMReX_FabArrayUtility.H:1906

amrex::Abort
void Abort(const std::string &msg)
Print a fatal-error message to stderr and abort execution.
Definition AMReX.cpp:241

amrex::int
const int[]
Definition AMReX_BLProfiler.cpp:1664

amrex::OverrideSync
void OverrideSync(FabArray< FAB > &fa, FabArray< IFAB > const &msk, const Periodicity &period)
Definition AMReX_FabArrayUtility.H:1379

amrex::Divide
void Divide(FabArray< FAB > &dst, FabArray< FAB > const &src, int srccomp, int dstcomp, int numcomp, int nghost)
Definition AMReX_FabArrayUtility.H:1260

amrex::ReduceLogicalAnd
bool ReduceLogicalAnd(FabArray< FAB > const &fa, int nghost, F &&f)
Definition AMReX_FabArrayUtility.H:757

amrex::ReduceMax
FAB::value_type ReduceMax(FabArray< FAB > const &fa, int nghost, F &&f)
Definition AMReX_FabArrayUtility.H:530

amrex::Subtract
void Subtract(FabArray< FAB > &dst, FabArray< FAB > const &src, int srccomp, int dstcomp, int numcomp, int nghost)
Definition AMReX_FabArrayUtility.H:1168

amrex::Saxpy
void Saxpy(MF &dst, typename MF::value_type a, MF const &src, int scomp, int dcomp, int ncomp, IntVect const &nghost)
dst += a * src
Definition AMReX_FabArrayUtility.H:1898

amrex::LocalAdd
void LocalAdd(MF &dst, MF const &src, int scomp, int dcomp, int ncomp, IntVect const &nghost)
dst += src
Definition AMReX_FabArrayUtility.H:1890

amrex::boxArray
BoxArray const & boxArray(FabArrayBase const &fa)
Definition AMReX_FabArrayBase.cpp:2862

amrex::ReduceSum
FAB::value_type ReduceSum(FabArray< FAB > const &fa, int nghost, F &&f)
Definition AMReX_FabArrayUtility.H:16

amrex::setVal
void setVal(MF &dst, typename MF::value_type val)
dst = val
Definition AMReX_FabArrayUtility.H:1861

amrex::Array4BoxTag
Definition AMReX_TagParallelFor.H:58

amrex::Array4BoxTag::dfab
Array4< T > dfab
Definition AMReX_TagParallelFor.H:59

amrex::DefinitelyNotHostRunnable
Definition AMReX_TypeTraits.H:94

amrex::MFInfo
FabArray memory allocation information.
Definition AMReX_FabArray.H:68

amrex::MFItInfo
Definition AMReX_MFIter.H:20

amrex::TypeList
Struct for holding types.
Definition AMReX_TypeList.H:13