Block-Structured AMR Software Framework
3 #include <AMReX_Config.H>
4 #include <AMReX_TypeTraits.H>
5 #include <AMReX_FabArray.H>
6 #include <AMReX_FArrayBox.H>
8 namespace amrex::NonLocalBC {
11 // [concept.IndexMapping]
12 //
/// \brief Names the type of the expression `m.Inverse(args...)`.
///
/// `m` is a value of type `Mapping` and `args...` are values of the types
/// `Params...`. Substitution fails when that member call is ill-formed, so
/// the alias can be used as the operation of a detection trait.
template <class Mapping, class... Params>
using Inverse_t = decltype(std::declval<Mapping>().Inverse(std::declval<Params>()...));
19 template <typename T>
20 struct HasInverseMemFn : IsDetectedExact<Dim3, Inverse_t, T, Dim3> {};
24 template <class IndexMap>
26  : Conjunction<IsCallableR<Dim3, IndexMap&, const Dim3&>,
27  HasInverseMemFn<const IndexMap&>> {};
30 // [IndexMapping.MultiBlockIndexMapping]
31 //
51  [[nodiscard]] AMREX_GPU_HOST_DEVICE Dim3 operator()(Dim3 i) const noexcept {
52  int iv[3]{i.x, i.y, i.z};
53  int iv_new[3]{};
54  for (int d = 0; d < AMREX_SPACEDIM; ++d) {
55  iv_new[d] = sign[d] * (iv[permutation[d]] - offset[d]);
56  }
57  return {iv_new[0], iv_new[1], iv_new[2]};
58  }
66  [[nodiscard]] AMREX_GPU_HOST_DEVICE Dim3 Inverse(Dim3 i) const noexcept {
67  int iv_new[3]{i.x, i.y, i.z};
68  int iv[3]{};
69  for (int d = 0; d < AMREX_SPACEDIM; ++d) {
70  AMREX_ASSERT(sign[d] == 1 || sign[d] == -1);
71  iv[permutation[d]] = iv_new[d] * sign[d] + offset[d];
72  }
73  return {iv[0], iv[1], iv[2]};
74  }
76  [[nodiscard]] IndexType operator()(IndexType it) const noexcept {
77  return IndexType{IntVect{AMREX_D_DECL(it[permutation[0]], it[permutation[1]], it[permutation[2]])}};
78  }
80  [[nodiscard]] IndexType Inverse(IndexType it) const noexcept {
81  IntVect inverse_permutation;
82  for (int i = 0; i < AMREX_SPACEDIM; ++i) {
83  inverse_permutation[permutation[i]] = i;
84  }
85  return IndexType{IntVect{AMREX_D_DECL(it[inverse_permutation[0]], it[inverse_permutation[1]], it[inverse_permutation[2]])}};
86  }
87 };
100 template <typename DTOS>
101 std::enable_if_t<IsCallableR<Dim3, DTOS, Dim3>::value, IntVect>
102 Apply(DTOS const& dtos, const IntVect& iv)
103 {
104  Dim3 i = dtos(iv.dim3());
105  return IntVect{AMREX_D_DECL(i.x, i.y, i.z)};
106 }
116 template <typename DTOS>
117 std::enable_if_t<IsCallableR<Dim3, DTOS, Dim3>::value && !IsCallableR<IndexType, DTOS, IndexType>::value, Box>
118 Image (DTOS const& dtos, const Box& box)
119 {
120  IntVect mapped_smallEnd = Apply(dtos, box.smallEnd());
121  IntVect mapped_bigEnd = Apply(dtos, box.bigEnd());
122  IntVect smallEnd;
123  IntVect bigEnd;
124  for (int d = 0; d < AMREX_SPACEDIM; ++d) {
125  smallEnd[d] = std::min(mapped_smallEnd[d], mapped_bigEnd[d]);
126  bigEnd[d] = std::max(mapped_smallEnd[d], mapped_bigEnd[d]);
127  }
128  return Box{smallEnd, bigEnd, box.ixType()};
129 }
139 template <typename DTOS>
140 std::enable_if_t<IsCallableR<Dim3, DTOS, Dim3>::value && IsCallableR<IndexType, DTOS, IndexType>::value, Box>
141 Image (DTOS const& dtos, const Box& box)
142 {
143  // "Forget" the index type mapping and invoke Image without changing the index type.
144  Box srcbox = Image([&dtos](Dim3 d) { return dtos(d); }, box);
145  // Fix the index type of the resulting box
146  srcbox.setType(dtos(box.ixType()));
147  return srcbox;
148 }
161 template <typename DTOS>
162 std::enable_if_t<HasInverseMemFn<DTOS>::value, IntVect>
163 ApplyInverse(DTOS const& dtos, const IntVect& iv)
164 {
165  return Apply([&dtos](Dim3 i) { return dtos.Inverse(i); }, iv);
166 }
176 template <typename DTOS>
177 std::enable_if_t<HasInverseMemFn<DTOS>::value && !IsCallableR<IndexType, DTOS, IndexType>::value, Box>
178 InverseImage (DTOS const& dtos, const Box& box)
179 {
180  return Image([&dtos](Dim3 i) { return dtos.Inverse(i); }, box);
181 }
191 template <typename DTOS>
192 std::enable_if_t<HasInverseMemFn<DTOS>::value && IsCallableR<IndexType, DTOS, IndexType>::value, Box>
193 InverseImage (DTOS const& dtos, const Box& box)
194 {
195  return Image([&dtos](auto&& i) { return dtos.Inverse(i); }, box);
196 }
199 static_assert(IsIndexMapping<MultiBlockIndexMapping>(), // NOLINT(bugprone-throw-keyword-missing)
200  "MultiBlockIndexMapping is expected to satisfy IndexMapping");
203 // [class.MultiBlockCommMetaData]
204 //
216  template <typename DTOS,
217  typename = std::enable_if_t<IsIndexMapping<DTOS>::value>>
218  MultiBlockCommMetaData(const FabArrayBase& dst, const Box& dstbox, const FabArrayBase& src,
219  const IntVect& ngrow, DTOS const& dtos);
224  template <typename DTOS,
225  typename = std::enable_if_t<IsIndexMapping<DTOS>::value>>
227  const Box& dstbox, const BoxArray& srcba,
228  const DistributionMapping& srcdm, const IntVect& ngrow, DTOS const& dtos);
256  template <typename DTOS>
257  std::enable_if_t<IsIndexMapping<DTOS>::value>
258  define(const BoxArray& dstba, const DistributionMapping& dstdm, const Box& dstbox,
259  const BoxArray& srcba, const DistributionMapping& srcdm, const IntVect& ngrow,
260  DTOS const& dtos);
261 };
264 // [concept.FabProjection]
265 //
268 template <typename P, typename FAB>
270  : IsCallableR<typename FAB::value_type, P, Array4<const typename FAB::value_type>, Dim3, int>
271 {};
274 // [FabProjection.Identity]
275 // [IndexMapping.Identity]
280 struct Identity {
282  constexpr Dim3 operator()(Dim3 i) const noexcept { return i; }
284  [[nodiscard]] static constexpr Dim3 Inverse(Dim3 i) noexcept { return i; }
287  template <typename T>
288  constexpr T operator()(Array4<const T> array, Dim3 i, int comp = 0) const
289  noexcept(noexcept(array(i.x, i.y, i.z, comp))) {
290  return array(i.x, i.y, i.z, comp);
291  }
294  constexpr int operator()(int i) const noexcept { return i; }
295 };
296 static constexpr Identity identity{};
298 static_assert(sizeof(Identity) == 1 );
299 static_assert(std::is_trivially_default_constructible_v<Identity> );
300 static_assert(std::is_trivially_copy_assignable_v<Identity> );
301 static_assert(std::is_trivially_copy_constructible_v<Identity> );
302 static_assert(IsIndexMapping<Identity>() ); // NOLINT(bugprone-throw-keyword-missing)
303 static_assert(IsFabProjection<Identity, FArrayBox>() ); // NOLINT(bugprone-throw-keyword-missing)
306 // [FabProjection.MapComponents]
314 template <typename Base, typename Map = Identity> struct MapComponents {
315  static_assert(IsCallable<Base, Array4<const Real>, Dim3, int>::value,
316  "Base needs to be a callable function: (Array4<const T>, Dim3, i) -> auto.");
318  static_assert(IsCallableR<int, Map, int>::value,
319  "Map needs to be a callable function: int -> int.");
321  Base base;
322  Map map;
324  template <typename T,
325  typename = std::enable_if_t<IsCallable<Base, Array4<const T>, Dim3, int>::value>,
326  typename = std::enable_if_t<IsCallableR<int, Map, int>::value>>
327  constexpr decltype(auto) operator()(Array4<const T> array, Dim3 i, int comp) const
328  noexcept(noexcept(base(array, i, map(comp)))) {
329  return base(array, i, map(comp));
330  }
331 };
333 static_assert(std::is_trivially_copy_assignable<MapComponents<Identity>>() ); // NOLINT(bugprone-throw-keyword-missing)
334 static_assert(std::is_trivially_copy_constructible<MapComponents<Identity>>() ); // NOLINT(bugprone-throw-keyword-missing)
335 static_assert(IsFabProjection<MapComponents<Identity>, FArrayBox>() ); // NOLINT(bugprone-throw-keyword-missing)
338 // [FabProjection.MapComponents.SwapComponents]
/// \brief Component map that exchanges the two compile-time indices I and J.
///
/// Every other component index is returned unchanged.
template <int I, int J> struct SwapComponents {
    static_assert(I >= 0 && J >= 0, "I >= 0 && J >= 0");

    /// \brief Returns J for `i == I`, I for `i == J`, and `i` otherwise.
    constexpr int operator()(int i) const noexcept {
        if (i == I) {
            return J;
        }
        if (i == J) {
            return I;
        }
        return i;
    }
};
357 template <int I> struct SwapComponents<I, -1> {
358  static_assert(I >= 0, "I >= 0");
360  int J;
361  constexpr int operator()(int i) const noexcept {
362  const int map[2] = {I, J};
363  return i == I || i == J ? map[std::size_t(i == I)] : i;
364  }
365 };
367 template <int J> struct SwapComponents<-1, J> {
368  static_assert(J >= 0, "J >= 0");
370  int I;
371  constexpr int operator()(int i) const noexcept {
372  const int map[2] = {I, J};
373  return i == I || i == J ? map[std::size_t(i == I)] : i;
374  }
375 };
377 template <> struct SwapComponents<-1, -1> {
378  int I;
379  int J;
380  constexpr int operator()(int i) const noexcept {
381  const int map[2] = {I, J};
382  return i == I || i == J ? map[std::size_t(i == I)] : i;
383  }
384 };
388 template <int I, int J> static constexpr SwapComponents<I, J> swap_indices{};
390 static_assert(sizeof(SwapComponents<0, 1>) == 1 );
391 static_assert(sizeof(DynamicSwapComponents) == 2 * sizeof(int) );
392 static_assert(sizeof(SwapComponents<0, -1>) == sizeof(int) );
393 static_assert(sizeof(SwapComponents<-1, 1>) == sizeof(int) );
394 static_assert(std::is_trivially_default_constructible<MapComponents<Identity, SwapComponents<0, 1>>>() ); // NOLINT(bugprone-throw-keyword-missing)
395 static_assert(std::is_trivially_copy_assignable<MapComponents<Identity, SwapComponents<0, 1>>>() ); // NOLINT(bugprone-throw-keyword-missing)
396 static_assert(std::is_trivially_copy_constructible<MapComponents<Identity, SwapComponents<0, 1>>>() ); // NOLINT(bugprone-throw-keyword-missing)
397 static_assert(IsFabProjection<MapComponents<Identity, SwapComponents<0, 1>>, FArrayBox>() ); // NOLINT(bugprone-throw-keyword-missing)
399 static_assert(swap_indices<0, 1>(0) == 1 );
400 static_assert(swap_indices<0, 1>(1) == 0 );
401 static_assert(swap_indices<0, 1>(2) == 2 );
402 static_assert(DynamicSwapComponents{0, 1}(0) == 1 );
403 static_assert(DynamicSwapComponents{0, 1}(1) == 0 );
404 static_assert(DynamicSwapComponents{0, 1}(2) == 2 );
407 // [class.CommData]
408 // [class.CommHandler]
415 struct CommData {
416 #ifdef AMREX_USE_MPI
433 #endif
434 };
436 #ifdef AMREX_USE_MPI
438 void PrepareCommBuffers(CommData& comm, const FabArrayBase::MapOfCopyComTagContainers& cctc,
439  int n_components, std::size_t object_size, std::size_t align);
442 void PostRecvs(CommData& recv, int mpi_tag);
445 void PostSends(CommData& send, int mpi_tag);
446 #endif
452 struct CommHandler {
453 #ifdef AMREX_USE_MPI
454  int mpi_tag{};
457 #endif
458 };
461 // [concept.DataPacking]
462 //
/// \brief Type of the unqualified call `PrepareSendBuffers(params...)`.
///        Substitution fails if no such call is well-formed.
template <class... Params>
using PrepareSendBuffers_t = decltype(PrepareSendBuffers(std::declval<Params>()...));

/// \brief Type of the unqualified call `PrepareRecvBuffers(params...)`.
///        Substitution fails if no such call is well-formed.
template <class... Params>
using PrepareRecvBuffers_t = decltype(PrepareRecvBuffers(std::declval<Params>()...));

/// \brief Type of the unqualified call `PackSendBuffers(params...)`.
///        Substitution fails if no such call is well-formed.
template <class... Params>
using PackSendBuffers_t = decltype(PackSendBuffers(std::declval<Params>()...));

/// \brief Type of the unqualified call `UnpackRecvBuffers(params...)`.
///        Substitution fails if no such call is well-formed.
template <class... Params>
using UnpackRecvBuffers_t = decltype(UnpackRecvBuffers(std::declval<Params>()...));

/// \brief Type of the unqualified call `LocalCopy(params...)`.
///        Substitution fails if no such call is well-formed.
template <class... Params>
using LocalCopy_t = decltype(LocalCopy(std::declval<Params>()...));
479 template <typename DP, typename FAB>
481  Conjunction<
482  IsDetected<LocalCopy_t, DP&, FabArray<FAB>&, const FabArray<FAB>&, const FabArrayBase::CopyComTagsContainer&>
483 #ifdef AMREX_USE_MPI
484  ,IsDetected<PrepareSendBuffers_t, DP&, FabArray<FAB>&, const FabArray<FAB>&, CommData&, const FabArrayBase::MapOfCopyComTagContainers&>,
485  IsDetected<PrepareRecvBuffers_t, DP&, FabArray<FAB>&, const FabArray<FAB>&, CommData&, const FabArrayBase::MapOfCopyComTagContainers&>,
486  IsDetected<PackSendBuffers_t, DP&, const FabArray<FAB>&, CommData&>,
487  IsDetected<UnpackRecvBuffers_t, DP&, FabArray<FAB>&, CommData&>
488 #endif
489  > {};
491 template <class FAB, class DTOS = Identity, class Proj = Identity>
492 std::enable_if_t<IsBaseFab<FAB>() && IsCallableR<Dim3, DTOS, Dim3>() && IsFabProjection<Proj, FAB>()>
493 local_copy_cpu (FabArray<FAB>& dest, const FabArray<FAB>& src, int dcomp, int scomp, int ncomp,
494  FabArrayBase::CopyComTagsContainer const& local_tags, DTOS const& dtos = DTOS{},
495  Proj const& proj = Proj{}) noexcept;
497 template <class FAB, class DTOS = Identity, class Proj = Identity>
498 std::enable_if_t<IsBaseFab<FAB>() && IsCallableR<Dim3, DTOS, Dim3>() && IsFabProjection<Proj, FAB>()>
499 unpack_recv_buffer_cpu (FabArray<FAB>& mf, int dcomp, int ncomp, Vector<char*> const& recv_data,
500  Vector<std::size_t> const& recv_size,
502  DTOS const& dtos = DTOS{}, Proj const& proj = Proj{}) noexcept;
504 #ifdef AMREX_USE_GPU
505 template <class FAB, class DTOS = Identity, class Proj = Identity>
506 std::enable_if_t<IsBaseFab<FAB>() && IsCallableR<Dim3, DTOS, Dim3>() && IsFabProjection<Proj, FAB>()>
507 local_copy_gpu (FabArray<FAB>& dest, const FabArray<FAB>& src, int dcomp, int scomp, int ncomp,
508  FabArrayBase::CopyComTagsContainer const& local_tags, DTOS const& dtos = DTOS{},
509  Proj const& proj = Proj{}) noexcept;
511 template <class FAB, class DTOS = Identity, class Proj = Identity>
512 std::enable_if_t<IsBaseFab<FAB>() && IsCallableR<Dim3, DTOS, Dim3>() && IsFabProjection<Proj, FAB>()>
513 unpack_recv_buffer_gpu (FabArray<FAB>& mf, int scomp, int ncomp,
514  Vector<char*> const& recv_data,
515  Vector<std::size_t> const& recv_size,
517  DTOS const& dtos = DTOS{}, Proj const& proj = Proj{});
518 #endif
521 // [DataPacking.PackComponents]
522 //
523 // PackComponents is the simplest data packing policy.
524 // This provides us with sane default behaviour that we can use when defining new
525 // data packing policies.
531  int n_components{0};
532 };
535 template <typename FAB>
536 std::enable_if_t<IsBaseFab<FAB>::value>
537 LocalCopy (const PackComponents& components, FabArray<FAB>& dest, const FabArray<FAB>& src,
538  const FabArrayBase::CopyComTagsContainer& local_tags) {
539 #ifdef AMREX_USE_GPU
540  if (Gpu::inLaunchRegion()) {
541  local_copy_gpu(dest, src, components.dest_component, components.src_component,
542  components.n_components, local_tags);
543  } else
544 #endif
545  {
546  local_copy_cpu(dest, src, components.dest_component, components.src_component,
547  components.n_components, local_tags);
548  }
549 }
551 #ifdef AMREX_USE_MPI
553 template <typename FAB>
554 std::enable_if_t<IsBaseFab<FAB>::value>
555 PrepareSendBuffers (const PackComponents& components, FabArray<FAB>& dest, const FabArray<FAB>& src,
557  using T = typename FAB::value_type;
558  ignore_unused(dest, src);
559  PrepareCommBuffers(comm, cctc, components.n_components, sizeof(T), alignof(T));
560 }
563 template <typename FAB>
564 std::enable_if_t<IsBaseFab<FAB>::value>
565 PrepareRecvBuffers (const PackComponents& components, FabArray<FAB>& dest, const FabArray<FAB>& src,
567  using T = typename FAB::value_type;
568  ignore_unused(dest, src);
569  PrepareCommBuffers(comm, cctc, components.n_components, sizeof(T), alignof(T));
570 }
573 template <typename FAB>
574 std::enable_if_t<IsBaseFab<FAB>::value>
575 PackSendBuffers (const PackComponents& components, const FabArray<FAB>& src, CommData& send) {
576 #ifdef AMREX_USE_GPU
577  if (Gpu::inLaunchRegion()) {
579, send.size, send.cctc);
580  } else
581 #endif // AMREX_USE_GPU
582  {
584, send.size, send.cctc);
585  }
586 }
589 template <typename FAB>
590 std::enable_if_t<IsBaseFab<FAB>::value>
591 UnpackRecvBuffers (const PackComponents& components, FabArray<FAB>& dest, const CommData& recv) {
592 #ifdef AMREX_USE_GPU
593  if (Gpu::inLaunchRegion()) {
594  unpack_recv_buffer_gpu(dest, components.dest_component, components.n_components,,
595  recv.size, recv.cctc);
596  } else
597 #endif // AMREX_USE_GPU
598  {
599  unpack_recv_buffer_cpu(dest, components.dest_component, components.n_components,,
600  recv.size, recv.cctc);
601  }
602 }
603 #endif // AMREX_USE_MPI
605 static_assert(IsDataPacking<PackComponents, FArrayBox>(), // NOLINT(bugprone-throw-keyword-missing)
606  "PackComponents is expected to satisfy the concept DataPacking.");
609 // [DataPacking.ApplyDtosAndProjectionOnReciever]
610 //
614 template <typename DTOS = Identity, typename FabProj = Identity>
616  constexpr ApplyDtosAndProjectionOnReciever() = default;
617  constexpr ApplyDtosAndProjectionOnReciever(const PackComponents& components, DTOS dtos_ = DTOS{}, FabProj proj_ = FabProj{})
618  : PackComponents(components), dtos(std::move(dtos_)), proj(std::move(proj_)) {}
620  DTOS dtos;
621  FabProj proj;
623  static_assert(IsCallableR<Dim3, DTOS, Dim3>(), "DTOS needs to be a callable: Dim3 -> Dim3");
624  static_assert(IsFabProjection<FabProj, FArrayBox>(), "FabProj needs to be at least a projection on FArrayBox.");
625 };
628 template <typename FAB, typename DTOS, typename FabProj>
629 std::enable_if_t<IsBaseFab<FAB>::value>
631  const FabArray<FAB>& src, const FabArrayBase::CopyComTagsContainer& local_tags) {
632  static_assert(IsFabProjection<FabProj, FAB>(), "FabProj needs to be a projection for given FAB type.");
633 #ifdef AMREX_USE_GPU
634  if (Gpu::inLaunchRegion()) {
635  local_copy_gpu(dest, src, packing.dest_component, packing.src_component,
636  packing.n_components, local_tags, packing.dtos, packing.proj);
637  } else
638 #endif
639  {
640  local_copy_cpu(dest, src, packing.dest_component, packing.src_component,
641  packing.n_components, local_tags, packing.dtos, packing.proj);
642  }
643 }
645 #ifdef AMREX_USE_MPI
647 template <typename FAB, typename DTOS, typename FabProj>
648 std::enable_if_t<IsBaseFab<FAB>::value>
650  FabArray<FAB>& dest, const CommData& recv) {
651  // If FAB is not FArrayBox we have not checked for the correct types yet.
652  static_assert(IsFabProjection<FabProj, FAB>(), "FabProj needs to be a projection for given FAB type.");
653 #ifdef AMREX_USE_GPU
654  if (Gpu::inLaunchRegion()) {
655  unpack_recv_buffer_gpu(dest, packing.dest_component, packing.n_components,,
656  recv.size, recv.cctc, packing.dtos, packing.proj);
657  } else
658 #endif // AMREX_USE_GPU
659  {
660  unpack_recv_buffer_cpu(dest, packing.dest_component, packing.n_components,,
661  recv.size, recv.cctc, packing.dtos, packing.proj);
662  }
663 }
664 #endif // AMREX_USE_MPI
666 static_assert(IsDataPacking<ApplyDtosAndProjectionOnReciever<>, FArrayBox>(), // NOLINT(bugprone-throw-keyword-missing)
667  "ApplyDtosAndProjectionOnReciever<> is expected to satisfy the DataPacking concept.");
670 // [ParallelCopy_nowait]
/// \brief Tag type for the overloads called with `no_local_copy`.
struct NoLocalCopy {};
/// \brief Tag type counterpart of NoLocalCopy, used with `do_local_copy`.
struct DoLocalCopy {};

// The tag objects are `inline constexpr` rather than `static constexpr`: in a
// header, `static` gives every translation unit its own internal-linkage
// copy, whereas an inline variable is a single entity program-wide.

/// \brief Tag object of type NoLocalCopy.
inline constexpr NoLocalCopy no_local_copy{};
/// \brief Tag object of type DoLocalCopy.
inline constexpr DoLocalCopy do_local_copy{};
696 template <typename FAB, typename DataPacking,
697  typename = std::enable_if_t<IsBaseFab<FAB>::value>,
698  typename = std::enable_if_t<IsDataPacking<DataPacking, FAB>::value>>
699 #ifdef AMREX_USE_MPI
702  const FabArrayBase::CommMetaData& cmd, const DataPacking& data_packing) {
703  CommHandler handler{};
704  if (ParallelContext::NProcsSub() == 1) {
705  return handler;
706  }
707  //
708  // Do this before prematurely exiting if running in parallel.
709  // Otherwise sequence numbers will not match across MPI processes.
710  //
713  if (cmd.m_RcvTags && !(cmd.m_RcvTags->empty())) {
714  PrepareRecvBuffers(data_packing, dest, src, handler.recv, *cmd.m_RcvTags);
715  PostRecvs(handler.recv, handler.mpi_tag);
716  }
718  if (cmd.m_SndTags && !(cmd.m_SndTags->empty())) {
719  PrepareSendBuffers(data_packing, dest, src, handler.send, *cmd.m_SndTags);
720  PackSendBuffers(data_packing, src, handler.send);
721  PostSends(handler.send, handler.mpi_tag);
722  }
723  return handler;
724 }
725 #else
727  const FabArrayBase::CommMetaData&, const DataPacking&) {
728  return CommHandler{};
729 }
730 #endif
753 template <typename FAB, typename DataPacking,
754  typename = std::enable_if_t<IsBaseFab<FAB>::value>,
755  typename = std::enable_if_t<IsDataPacking<DataPacking, FAB>::value>>
756 #ifdef AMREX_USE_MPI
758 #endif
759 CommHandler
761  const FabArrayBase::CommMetaData& cmd, const DataPacking& data_packing) {
762  CommHandler comm = ParallelCopy_nowait(no_local_copy, dest, src, cmd, data_packing);
763  // Eagerly do the local work and hope for some overlap with communication
764  if (cmd.m_LocTags && !cmd.m_LocTags->empty()) {
765  LocalCopy(data_packing, dest, src, *cmd.m_LocTags);
766  }
767  return comm;
768 }
770 // [ParallelCopy_finish]
790 template <typename FAB, typename DataPacking>
791 std::enable_if_t<IsBaseFab<FAB>() && IsDataPacking<DataPacking, FAB>()>
792 #ifdef AMREX_USE_MPI
794  const FabArrayBase::CommMetaData& cmd, const DataPacking& data_packing) {
795  // If any FabArray is empty we have nothing to do.
796  if (dest.empty()) {
797  return;
798  }
799  // Return if there is nothing to do
800  if (ParallelContext::NProcsSub() == 1) {
801  return;
802  }
803  // Unpack receives
804  if (cmd.m_RcvTags && !(cmd.m_RcvTags->empty())) {
806 #ifdef AMREX_DEBUG
807  if (!CheckRcvStats(handler.recv.stats, handler.recv.size, handler.mpi_tag)) {
808  amrex::Abort("NonLocalPC::ParallelCopy_finish failed with wrong message size");
809  }
810 #endif
811  UnpackRecvBuffers(data_packing, dest, handler.recv);
812  }
814  // Wait for all sends to be done
815  if (cmd.m_SndTags && !(cmd.m_SndTags->empty())) {
817  }
818 }
819 #else
821 #endif
842 template <typename FAB, typename DataPacking>
843 std::enable_if_t<IsBaseFab<FAB>() && IsDataPacking<DataPacking, FAB>()>
845  const FabArrayBase::CommMetaData& cmd, const DataPacking& data_packing) {
846  // Eagerly do the local work and hope for some overlap with communication
847  if (cmd.m_LocTags && !cmd.m_LocTags->empty()) {
848  LocalCopy(data_packing, dest, src, *cmd.m_LocTags);
849  }
850  ParallelCopy_finish(dest, std::move(handler), cmd, data_packing); // NOLINT
851 }
877 template <typename FAB, typename DTOS = Identity, typename Proj = Identity>
878 std::enable_if_t<IsBaseFab<FAB>() && IsCallableR<Dim3, DTOS, Dim3>() && IsFabProjection<Proj, FAB>()>
880  SrcComp srccomp, DestComp destcomp, NumComps numcomp, DTOS const& dtos = DTOS{}, Proj const& proj = Proj{}) {
881  PackComponents components{};
882  components.dest_component = destcomp.i;
883  components.src_component = srccomp.i;
884  components.n_components = numcomp.n;
885  ApplyDtosAndProjectionOnReciever<DTOS, Proj> packing{components, dtos, proj};
886  CommHandler handler = ParallelCopy_nowait(dest, src, cmd, packing);
887  ParallelCopy_finish(dest, std::move(handler), cmd, packing); // NOLINT
888 }
914 template <typename FAB, typename DTOS = Identity, typename Proj = Identity>
915 std::enable_if_t<IsBaseFab<FAB>() && IsCallableR<Dim3, DTOS, Dim3>() && IsFabProjection<Proj, FAB>()>
917  int srccomp, int destcomp, int numcomp, DTOS const& dtos = DTOS{}, Proj const& proj = Proj{}) {
918  ParallelCopy(dest, src, cmd, SrcComp(srccomp), DestComp(destcomp), NumComps(numcomp), dtos, proj);
919 }
950 template <typename FAB, typename DTOS = Identity, typename Proj = Identity>
951 std::enable_if_t<IsBaseFab<FAB>() && IsIndexMapping<DTOS>() && IsFabProjection<Proj, FAB>(),
952 MultiBlockCommMetaData>
953 ParallelCopy (FabArray<FAB>& dest, const Box& destbox, const FabArray<FAB>& src, SrcComp srccomp,
954  DestComp destcomp, NumComps numcomp, const IntVect& ngrow, DTOS const& dtos = DTOS{}, Proj const& proj = Proj{}) {
955  MultiBlockCommMetaData cmd(dest, destbox, src, ngrow, dtos);
956  ParallelCopy(dest, src, cmd, srccomp, destcomp, numcomp, dtos, proj);
957  return cmd;
958 }
989 template <typename FAB, typename DTOS = Identity, typename Proj = Identity>
990 std::enable_if_t<IsBaseFab<FAB>() && IsIndexMapping<DTOS>() && IsFabProjection<Proj, FAB>(),
991 MultiBlockCommMetaData>
992 ParallelCopy (FabArray<FAB>& dest, const Box& destbox, const FabArray<FAB>& src, int srccomp,
993  int destcomp, int numcomp, const IntVect& ngrow, DTOS const& dtos = DTOS{}, Proj const& proj = Proj{}) {
994  return ParallelCopy(dest, destbox, src, SrcComp(srccomp), DestComp(destcomp), NumComps(numcomp), ngrow, dtos, proj);
995 }
997 // Rotate90 fills the lo-x and lo-y boundary regions by rotating the data
998 // around (x=0,y=0) by 90 degrees in either direction. It also fills the
999 // corner of lo-x and lo-y boundary region by rotating the data by 180
1000 // degrees.
1002 template <class FAB>
1003 std::enable_if_t<IsBaseFab<FAB>::value>
1004 Rotate90 (FabArray<FAB>& mf, int scomp, int ncomp, IntVect const& nghost, Box const& domain);
1006 template <class FAB>
1007 std::enable_if_t<IsBaseFab<FAB>::value>
1008 Rotate90 (FabArray<FAB>& mf, Box const& domain);
1010 // Rotate180 fills the lo-x boundary by rotating the data around
1011 // (x=0,y=L_y/2) by 180 degrees.
1013 template <class FAB>
1014 std::enable_if_t<IsBaseFab<FAB>::value>
1015 Rotate180 (FabArray<FAB>& mf, int scomp, int ncomp, IntVect const& nghost, Box const& domain);
1017 template <class FAB>
1018 std::enable_if_t<IsBaseFab<FAB>::value>
1019 Rotate180 (FabArray<FAB>& mf, Box const& domain);
1021 // Fill the polar boundaries of the spherical coordinates (theta, phi, r).
1022 // The lo-x boundary is filled with f(-x,y) = f(x,mod(y+pi,2*pi)), and
1023 // the hi-x boundary is filled with f(pi+x,y) = f(pi-x,mod(y+pi,2*pi)).
1025 template <class FAB>
1026 std::enable_if_t<IsBaseFab<FAB>::value>
1027 FillPolar (FabArray<FAB>& mf, int scomp, int ncomp, IntVect const& nghost, Box const& domain);
1029 template <class FAB>
1030 std::enable_if_t<IsBaseFab<FAB>::value>
1031 FillPolar (FabArray<FAB>& mf, Box const& domain);
1069 template <typename FAB, typename DTOS, typename Proj = Identity>
1070 [[nodiscard]]
1071 std::enable_if_t<IsBaseFab<FAB>() &&
1074  CommHandler>
1076  int scomp, int ncomp, DTOS const& dtos,
1077  Proj const& proj = Proj{});
1114 template <typename FAB, typename DTOS, typename Proj = Identity>
1115 std::enable_if_t<IsBaseFab<FAB>() &&
1117  IsFabProjection<Proj,FAB>()>
1119  FabArray<FAB>& mf, const FabArrayBase::CommMetaData& cmd,
1120  int scomp, int ncomp, DTOS const& dtos,
1121  Proj const& proj = Proj{});
1154 template <typename FAB, typename DTOS, typename Proj = Identity>
1155 std::enable_if_t<IsBaseFab<FAB>() &&
1157  IsFabProjection<Proj,FAB>()>
1159  int scomp, int ncomp, DTOS const& dtos, Proj const& proj = Proj{})
1160 {
1161  BL_PROFILE("FillBoundary(cmd)");
1162  auto handler = FillBoundary_nowait(mf, cmd, scomp, ncomp, dtos, proj);
1163  FillBoundary_finish(std::move(handler), mf, cmd, scomp, ncomp, dtos, proj);
1164 }
1180 template <typename FAB, typename DTOS>
1181 [[nodiscard]]
1182 std::enable_if_t<IsBaseFab<FAB>() && IsCallableR<Dim3,DTOS,Dim3>(),
1183  FabArrayBase::CommMetaData>
1185  Geometry const& geom, DTOS const& dtos);
1187 }
1189 #include <AMReX_NonLocalBCImpl.H>
1191 namespace amrex {
1196  using NonLocalBC::SphThetaPhiRIndexMapping;
1197  using NonLocalBC::SphThetaPhiRComponentMapping;
1204 }
1206 #endif
