aboutsummaryrefslogtreecommitdiff
path: root/Source/Utils/CoarsenIO.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'Source/Utils/CoarsenIO.cpp')
-rw-r--r--Source/Utils/CoarsenIO.cpp106
1 files changed, 106 insertions, 0 deletions
diff --git a/Source/Utils/CoarsenIO.cpp b/Source/Utils/CoarsenIO.cpp
new file mode 100644
index 000000000..b75d054b4
--- /dev/null
+++ b/Source/Utils/CoarsenIO.cpp
@@ -0,0 +1,106 @@
+#include "CoarsenIO.H"
+
+using namespace amrex;
+
+void
+CoarsenIO::Loop ( MultiFab& mf_dst,
+ const MultiFab& mf_src,
+ const int dcomp,
+ const int scomp,
+ const int ncomp,
+ const int ngrow,
+ const IntVect crse_ratio )
+{
+ // Staggering of source fine MultiFab and destination coarse MultiFab
+ const IntVect stag_src = mf_src.boxArray().ixType().toIntVect();
+ const IntVect stag_dst = mf_dst.boxArray().ixType().toIntVect();
+
+ if ( crse_ratio > IntVect(1) ) AMREX_ALWAYS_ASSERT_WITH_MESSAGE( ngrow == 0,
+ "option of filling guard cells of destination MultiFab with coarsening not supported for this interpolation" );
+
+ AMREX_ALWAYS_ASSERT_WITH_MESSAGE( mf_src.nGrowVect() >= stag_dst-stag_src+IntVect(ngrow),
+ "source fine MultiFab does not have enough guard cells for this interpolation" );
+
+ // Auxiliary integer arrays (always 3D)
+ Gpu::ManagedVector<int> sf_gpuarr, sc_gpuarr, cr_gpuarr;
+ sf_gpuarr.resize( 3 ); // staggering of source fine MultiFab
+ sc_gpuarr.resize( 3 ); // staggering of destination coarse MultiFab
+ cr_gpuarr.resize( 3 ); // coarsening ratio
+
+ sf_gpuarr[0] = stag_src[0];
+ sf_gpuarr[1] = stag_src[1];
+#if (AMREX_SPACEDIM == 2)
+ sf_gpuarr[2] = 0;
+#elif (AMREX_SPACEDIM == 3)
+ sf_gpuarr[2] = stag_src[2];
+#endif
+
+ sc_gpuarr[0] = stag_dst[0];
+ sc_gpuarr[1] = stag_dst[1];
+#if (AMREX_SPACEDIM == 2)
+ sc_gpuarr[2] = 0;
+#elif (AMREX_SPACEDIM == 3)
+ sc_gpuarr[2] = stag_dst[2];
+#endif
+
+ cr_gpuarr[0] = crse_ratio[0];
+ cr_gpuarr[1] = crse_ratio[1];
+#if (AMREX_SPACEDIM == 2)
+ cr_gpuarr[2] = 1;
+#elif (AMREX_SPACEDIM == 3)
+ cr_gpuarr[2] = crse_ratio[2];
+#endif
+
+ int const* const AMREX_RESTRICT sf = sf_gpuarr.data();
+ int const* const AMREX_RESTRICT sc = sc_gpuarr.data();
+ int const* const AMREX_RESTRICT cr = cr_gpuarr.data();
+
+#ifdef _OPENMP
+#pragma omp parallel if (Gpu::notInLaunchRegion())
+#endif
+ // Loop over boxes (or tiles if not on GPU)
+ for (MFIter mfi( mf_dst, TilingIfNotGPU() ); mfi.isValid(); ++mfi)
+ {
+ // Tiles defined at the coarse level
+ const Box& bx = mfi.growntilebox( ngrow );
+ Array4<Real> const& arr_dst = mf_dst.array( mfi );
+ Array4<Real const> const& arr_src = mf_src.const_array( mfi );
+ ParallelFor( bx, ncomp,
+ [=] AMREX_GPU_DEVICE( int i, int j, int k, int n )
+ {
+ arr_dst(i,j,k,n+dcomp) = CoarsenIO::Interp(
+ arr_src, sf, sc, cr, i, j, k, n+scomp );
+ } );
+ }
+}
+
+void
+CoarsenIO::Coarsen ( MultiFab& mf_dst,
+ const MultiFab& mf_src,
+ const int dcomp,
+ const int scomp,
+ const int ncomp,
+ const int ngrow,
+ const IntVect crse_ratio )
+{
+ BL_PROFILE( "CoarsenIO::Coarsen" );
+
+ // Convert BoxArray of source MultiFab to staggering of destination MultiFab and coarsen it
+ BoxArray ba_tmp = amrex::convert( mf_src.boxArray(), mf_dst.ixType().toIntVect() );
+ AMREX_ALWAYS_ASSERT_WITH_MESSAGE( ba_tmp.coarsenable( crse_ratio ),
+ "source MultiFab converted to staggering of destination MultiFab is not coarsenable" );
+ ba_tmp.coarsen( crse_ratio );
+
+ if ( ba_tmp == mf_dst.boxArray() and mf_src.DistributionMap() == mf_dst.DistributionMap() )
+ CoarsenIO::Loop( mf_dst, mf_src, dcomp, scomp, ncomp, ngrow, crse_ratio );
+ else
+ {
+ // Cannot coarsen into MultiFab with different BoxArray or DistributionMapping:
+ // 1) create temporary MultiFab on coarsened version of source BoxArray with same DistributionMapping
+ MultiFab mf_tmp( ba_tmp, mf_src.DistributionMap(), ncomp, 0, MFInfo(), FArrayBoxFactory() );
+ // 2) interpolate from mf_src to mf_tmp (start writing into component 0)
+ CoarsenIO::Loop( mf_tmp, mf_src, 0, scomp, ncomp, ngrow, crse_ratio );
+ // 3) copy from mf_tmp to mf_dst (with different BoxArray or DistributionMapping)
+ mf_dst.copy( mf_tmp, 0, dcomp, ncomp );
+ }
+}