Computes the slow right-hand side (RHS) of the evolution equations for the scalars other than density or potential temperature.
100 BL_PROFILE_REGION(
"erf_slow_rhs_post()");
102 const BCRec* bc_ptr_d = domain_bcs_type_d.data();
103 const BCRec* bc_ptr_h = domain_bcs_type_h.data();
109 const MultiFab* t_mean_mf =
nullptr;
110 if (most) t_mean_mf = most->get_mac_avg(level,2);
112 const bool l_use_terrain = (solverChoice.
mesh_type != MeshType::ConstantDz);
113 const bool l_moving_terrain = (solverChoice.
terrain_type == TerrainType::MovingFittedMesh);
114 const bool l_reflux = (solverChoice.
coupling_type != CouplingType::OneWay);
115 if (l_moving_terrain) AMREX_ALWAYS_ASSERT(l_use_terrain);
118 const bool l_use_KE = ( (tc.
les_type == LESType::Deardorff) ||
121 const bool l_need_SmnSmn = ( tc.
les_type == LESType::Deardorff ||
128 const bool l_use_turb = ( tc.
les_type == LESType::Smagorinsky ||
129 tc.
les_type == LESType::Deardorff ||
136 const Box& domain = geom.Domain();
138 const GpuArray<Real, AMREX_SPACEDIM> dxInv = geom.InvCellSizeArray();
139 const Real* dx = geom.CellSize();
144 const Array<Real,AMREX_SPACEDIM> grav{0.0, 0.0, -solverChoice.
gravity};
145 const GpuArray<Real,AMREX_SPACEDIM> grav_gpu{grav[0], grav[1], grav[2]};
152 const DistributionMapping& dm = S_data[
IntVars::cons].DistributionMap();
154 std::unique_ptr<MultiFab> dflux_x;
155 std::unique_ptr<MultiFab> dflux_y;
156 std::unique_ptr<MultiFab> dflux_z;
159 dflux_x = std::make_unique<MultiFab>(convert(ba,IntVect(1,0,0)), dm,
nvars, 0);
160 dflux_y = std::make_unique<MultiFab>(convert(ba,IntVect(0,1,0)), dm,
nvars, 0);
161 dflux_z = std::make_unique<MultiFab>(convert(ba,IntVect(0,0,1)), dm,
nvars, 0);
169 Vector<int> is_valid_slow_var; is_valid_slow_var.resize(
RhoQ1_comp+1,0);
170 if (l_use_KE) {is_valid_slow_var[
RhoKE_comp] = 1;}
180 Vector<Real> max_scal(nvar, 1.0e34); Gpu::DeviceVector<Real> max_scal_d(nvar);
181 Vector<Real> min_scal(nvar,-1.0e34); Gpu::DeviceVector<Real> min_scal_d(nvar);
182 if (l_use_mono_adv) {
184 for (
int ivar(
RhoKE_comp); ivar<nvar; ++ivar) {
185 GpuTuple<Real,Real> mm = ParReduce(TypeList<ReduceOpMax,ReduceOpMin>{},
186 TypeList<Real, Real>{},
188 [=] AMREX_GPU_DEVICE (
int box_no,
int i,
int j,
int k) noexcept
189 -> GpuTuple<Real,Real>
191 return { ma_s_arr[box_no](i,j,k,ivar), ma_s_arr[box_no](i,j,k,ivar) };
193 max_scal[ivar] = get<0>(mm);
194 min_scal[ivar] = get<1>(mm);
197 Gpu::copy(Gpu::hostToDevice, max_scal.begin(), max_scal.end(), max_scal_d.begin());
198 Gpu::copy(Gpu::hostToDevice, min_scal.begin(), min_scal.end(), min_scal_d.begin());
199 Real* max_s_ptr = max_scal_d.data();
200 Real* min_s_ptr = min_scal_d.data();
218 #pragma omp parallel if (Gpu::notInLaunchRegion())
221 std::array<FArrayBox,AMREX_SPACEDIM> flux;
222 std::array<FArrayBox,AMREX_SPACEDIM> flux_tmp;
227 for ( MFIter mfi(S_data[
IntVars::cons],TilingIfNotGPU()); mfi.isValid(); ++mfi) {
229 Box tbx = mfi.tilebox();
234 for (
int dir = 0; dir < AMREX_SPACEDIM; ++dir) {
235 flux[dir].resize(surroundingNodes(tbx,dir),
nvars);
236 flux[dir].setVal<RunOn::Device>(0.);
237 if (l_use_mono_adv) {
238 flux_tmp[dir].resize(surroundingNodes(tbx,dir),
nvars);
239 flux_tmp[dir].setVal<RunOn::Device>(0.);
242 const GpuArray<const Array4<Real>, AMREX_SPACEDIM>
243 flx_arr{{AMREX_D_DECL(flux[0].array(), flux[1].array(), flux[2].array())}};
244 Array4<Real> tmpx = (l_use_mono_adv) ? flux_tmp[0].array() : Array4<Real>{};
245 Array4<Real> tmpy = (l_use_mono_adv) ? flux_tmp[1].array() : Array4<Real>{};
246 Array4<Real> tmpz = (l_use_mono_adv) ? flux_tmp[2].array() : Array4<Real>{};
247 const GpuArray<Array4<Real>, AMREX_SPACEDIM> flx_tmp_arr{{AMREX_D_DECL(tmpx,tmpy,tmpz)}};
252 const Array4<const Real> & old_cons = S_old[
IntVars::cons].array(mfi);
253 const Array4< Real> & cell_rhs = S_rhs[
IntVars::cons].array(mfi);
255 const Array4< Real> & new_cons = S_new[
IntVars::cons].array(mfi);
256 const Array4< Real> & new_xmom = S_new[
IntVars::xmom].array(mfi);
257 const Array4< Real> & new_ymom = S_new[
IntVars::ymom].array(mfi);
258 const Array4< Real> & new_zmom = S_new[
IntVars::zmom].array(mfi);
260 const Array4< Real> & cur_cons = S_data[
IntVars::cons].array(mfi);
261 const Array4<const Real> & cur_prim = S_prim.array(mfi);
262 const Array4< Real> & cur_xmom = S_data[
IntVars::xmom].array(mfi);
263 const Array4< Real> & cur_ymom = S_data[
IntVars::ymom].array(mfi);
264 const Array4< Real> & cur_zmom = S_data[
IntVars::zmom].array(mfi);
270 const Array4<const Real> & u =
xvel.array(mfi);
271 const Array4<const Real> & v =
yvel.array(mfi);
273 const Array4<Real const>& mu_turb = l_use_turb ? eddyDiffs->const_array(mfi) : Array4<const Real>{};
275 const Array4<const Real>& z_nd = l_use_terrain ? z_phys_nd->const_array(mfi) : Array4<const Real>{};
276 const Array4<const Real>& detJ_new_arr = l_moving_terrain ? detJ_new->const_array(mfi) : Array4<const Real>{};
279 const Array4<const Real>& mf_m = mapfac_m->const_array(mfi);
280 const Array4<const Real>& mf_u = mapfac_u->const_array(mfi);
281 const Array4<const Real>& mf_v = mapfac_v->const_array(mfi);
284 const Array4<const Real>& SmnSmn_a = l_need_SmnSmn ? SmnSmn->const_array(mfi) : Array4<const Real>{};
290 const GpuArray<int, IntVars::NumTypes> scomp_slow = { 2,0,0,0};
291 const GpuArray<int, IntVars::NumTypes> ncomp_slow = {nsv,0,0,0};
297 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k,
int nn) {
299 cur_cons(i,j,k,n) = new_cons(i,j,k,n);
306 Box tbx_inc = mfi.nodaltilebox(0);
307 Box tby_inc = mfi.nodaltilebox(1);
308 Box tbz_inc = mfi.nodaltilebox(2);
310 ParallelFor(tbx_inc, tby_inc, tbz_inc,
311 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k) noexcept {
312 avg_xmom(i,j,k) = cur_xmom(i,j,k);
314 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k) noexcept {
315 avg_ymom(i,j,k) = cur_ymom(i,j,k);
317 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k) noexcept {
318 avg_zmom(i,j,k) = cur_zmom(i,j,k);
326 Array4<const Real> ax_arr;
327 Array4<const Real> ay_arr;
328 Array4<const Real> az_arr;
329 Array4<const Real> detJ_arr;
330 Array4<const EBCellFlag> cfg_arr;
332 EBCellFlagFab
const& cfg = ebfact.getMultiEBCellFlagFab()[mfi];
333 cfg_arr = cfg.const_array();
334 ax_arr = ebfact.getAreaFrac()[0]->const_array(mfi);
335 ay_arr = ebfact.getAreaFrac()[1]->const_array(mfi);
336 az_arr = ebfact.getAreaFrac()[2]->const_array(mfi);
337 detJ_arr = ebfact.getVolFrac().const_array(mfi);
339 ax_arr = ax->const_array(mfi);
340 ay_arr = ay->const_array(mfi);
341 az_arr = az->const_array(mfi);
342 detJ_arr = detJ->const_array(mfi);
345 AdvType horiz_adv_type, vert_adv_type;
346 Real horiz_upw_frac, vert_upw_frac;
348 Array4<Real> diffflux_x, diffflux_y, diffflux_z;
349 Array4<Real> hfx_x, hfx_y, hfx_z, diss;
350 Array4<Real> q1fx_x, q1fx_y, q1fx_z, q2fx_z;
351 const bool use_most = (most !=
nullptr);
354 diffflux_x = dflux_x->array(mfi);
355 diffflux_y = dflux_y->array(mfi);
356 diffflux_z = dflux_z->array(mfi);
358 hfx_x = Hfx1->array(mfi);
359 hfx_y = Hfx2->array(mfi);
360 hfx_z = Hfx3->array(mfi);
361 diss = Diss->array(mfi);
363 if (Q1fx1) q1fx_x = Q1fx1->array(mfi);
364 if (Q1fx2) q1fx_y = Q1fx2->array(mfi);
365 if (Q1fx3) q1fx_z = Q1fx3->array(mfi);
366 if (Q2fx3) q2fx_z = Q2fx3->array(mfi);
374 if (is_valid_slow_var[ivar])
409 cur_cons, cur_prim, cell_rhs,
410 l_use_mono_adv, max_s_ptr, min_s_ptr,
411 detJ_arr, dxInv, mf_m,
412 horiz_adv_type, vert_adv_type,
413 horiz_upw_frac, vert_upw_frac,
414 flx_arr, flx_tmp_arr, domain, bc_ptr_h);
417 avg_xmom, avg_ymom, avg_zmom,
419 cfg_arr, ax_arr, ay_arr, az_arr, detJ_arr, dxInv, mf_m,
420 horiz_adv_type, vert_adv_type,
421 horiz_upw_frac, vert_upw_frac,
422 flx_arr, domain, bc_ptr_h);
427 const Array4<const Real> tm_arr = t_mean_mf ? t_mean_mf->const_array(mfi) : Array4<const Real>{};
430 new_cons, cur_prim, cell_rhs,
431 diffflux_x, diffflux_y, diffflux_z,
432 z_nd, ax_arr, ay_arr, az_arr, detJ_arr,
433 dxInv, SmnSmn_a, mf_m, mf_u, mf_v,
434 hfx_x, hfx_y, hfx_z, q1fx_x, q1fx_y, q1fx_z,q2fx_z, diss,
435 mu_turb, solverChoice, level,
436 tm_arr, grav_gpu, bc_ptr_d, use_most);
439 new_cons, cur_prim, cell_rhs,
440 diffflux_x, diffflux_y, diffflux_z,
441 dxInv, SmnSmn_a, mf_m, mf_u, mf_v,
442 hfx_z, q1fx_z, q2fx_z, diss,
443 mu_turb, solverChoice, level,
444 tm_arr, grav_gpu, bc_ptr_d, use_most);
450 #if defined(ERF_USE_NETCDF)
451 if (moist_set_rhs_bool)
453 Box gtbx_moist = mfi.tilebox(IntVect(0),IntVect(2,2,0));
454 const Array4<const Real> & old_cons_const = S_old[
IntVars::cons].const_array(mfi);
455 const Array4<const Real> & new_cons_const = S_new[
IntVars::cons].const_array(mfi);
456 moist_set_rhs(tbx, gtbx_moist, old_cons_const, new_cons_const, cell_rhs,
457 bdy_time_interval, start_bdy_time, new_stage_time, dt, width, set_width, domain,
458 bdy_data_xlo, bdy_data_xhi, bdy_data_ylo, bdy_data_yhi);
464 BL_PROFILE(
"rhs_post_8");
466 const Real eps = std::numeric_limits<Real>::epsilon();
468 auto const& src_arr = source.const_array(mfi);
472 if (is_valid_slow_var[ivar])
482 if (l_moving_terrain)
484 ParallelFor(tbx, num_comp,
485 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k,
int nn) noexcept {
486 const int n = start_comp + nn;
487 cell_rhs(i,j,k,n) += src_arr(i,j,k,n);
488 Real temp_val = detJ_arr(i,j,k) * old_cons(i,j,k,n) + dt * detJ_arr(i,j,k) * cell_rhs(i,j,k,n);
489 cur_cons(i,j,k,n) = temp_val / detJ_new_arr(i,j,k);
491 cur_cons(i,j,k,n) = amrex::max(cur_cons(i,j,k,n), eps);
497 ParallelFor(tbx, num_comp,
498 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k,
int nn) noexcept {
499 const int n = start_comp + nn;
500 cell_rhs(i,j,k,n) += src_arr(i,j,k,n);
501 cur_cons(i,j,k,n) = old_cons(i,j,k,n) + dt * cell_rhs(i,j,k,n);
503 cur_cons(i,j,k,n) = amrex::max(cur_cons(i,j,k,n), eps);
505 cur_cons(i,j,k,n) = amrex::max(cur_cons(i,j,k,n), 0.0);
516 BL_PROFILE(
"rhs_post_9");
519 ParallelFor(tbx, num_comp_all,
520 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k,
int n) noexcept {
521 new_cons(i,j,k,n) = cur_cons(i,j,k,n);
525 Box xtbx = mfi.nodaltilebox(0);
526 Box ytbx = mfi.nodaltilebox(1);
527 Box ztbx = mfi.nodaltilebox(2);
530 BL_PROFILE(
"rhs_post_10()");
531 ParallelFor(xtbx, ytbx, ztbx,
532 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k) noexcept {
533 new_xmom(i,j,k) = cur_xmom(i,j,k);
535 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k) noexcept {
536 new_ymom(i,j,k) = cur_ymom(i,j,k);
538 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k) noexcept {
539 new_zmom(i,j,k) = cur_zmom(i,j,k);
544 BL_PROFILE(
"rhs_post_10");
546 if (l_reflux && nrk == 2) {
548 int num_comp_reflux =
nvars - strt_comp_reflux;
549 if (level < finest_level) {
550 fr_as_crse->CrseAdd(mfi,
551 {{AMREX_D_DECL(&(flux[0]), &(flux[1]), &(flux[2]))}},
552 dx, dt, strt_comp_reflux, strt_comp_reflux, num_comp_reflux, RunOn::Device);
555 fr_as_fine->FineAdd(mfi,
556 {{AMREX_D_DECL(&(flux[0]), &(flux[1]), &(flux[2]))}},
557 dx, dt, strt_comp_reflux, strt_comp_reflux, num_comp_reflux, RunOn::Device);
563 Gpu::streamSynchronize();
void AdvectionSrcForScalars(const amrex::Real &dt, const amrex::Box &bx, const int icomp, const int ncomp, const amrex::Array4< const amrex::Real > &avg_xmom, const amrex::Array4< const amrex::Real > &avg_ymom, const amrex::Array4< const amrex::Real > &avg_zmom, const amrex::Array4< const amrex::Real > &cur_cons, const amrex::Array4< const amrex::Real > &cell_prim, const amrex::Array4< amrex::Real > &src, const bool &use_mono_adv, amrex::Real *max_s_ptr, amrex::Real *min_s_ptr, const amrex::Array4< const amrex::Real > &vf_arr, const amrex::GpuArray< amrex::Real, AMREX_SPACEDIM > &cellSizeInv, const amrex::Array4< const amrex::Real > &mf_m, const AdvType horiz_adv_type, const AdvType vert_adv_type, const amrex::Real horiz_upw_frac, const amrex::Real vert_upw_frac, const amrex::GpuArray< const amrex::Array4< amrex::Real >, AMREX_SPACEDIM > &flx_arr, const amrex::GpuArray< amrex::Array4< amrex::Real >, AMREX_SPACEDIM > &flx_tmp_arr, const amrex::Box &domain, const amrex::BCRec *bc_ptr_h)
AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE AdvType EfficientAdvType(int nrk, AdvType adv_type)
Definition: ERF_Advection.H:254
@ nvars
Definition: ERF_DataStruct.H:74
void DiffusionSrcForState_N(const amrex::Box &bx, const amrex::Box &domain, int start_comp, int num_comp, const bool &exp_most, const amrex::Array4< const amrex::Real > &u, const amrex::Array4< const amrex::Real > &v, const amrex::Array4< const amrex::Real > &cell_data, const amrex::Array4< const amrex::Real > &cell_prim, const amrex::Array4< amrex::Real > &cell_rhs, const amrex::Array4< amrex::Real > &xflux, const amrex::Array4< amrex::Real > &yflux, const amrex::Array4< amrex::Real > &zflux, const amrex::GpuArray< amrex::Real, AMREX_SPACEDIM > &cellSizeInv, const amrex::Array4< const amrex::Real > &SmnSmn_a, const amrex::Array4< const amrex::Real > &mf_m, const amrex::Array4< const amrex::Real > &mf_u, const amrex::Array4< const amrex::Real > &mf_v, amrex::Array4< amrex::Real > &hfx_z, amrex::Array4< amrex::Real > &qfx1_z, amrex::Array4< amrex::Real > &qfx2_z, amrex::Array4< amrex::Real > &diss, const amrex::Array4< const amrex::Real > &mu_turb, const SolverChoice &solverChoice, const int level, const amrex::Array4< const amrex::Real > &tm_arr, const amrex::GpuArray< amrex::Real, AMREX_SPACEDIM > grav_gpu, const amrex::BCRec *bc_ptr, const bool use_most)
void DiffusionSrcForState_T(const amrex::Box &bx, const amrex::Box &domain, int start_comp, int num_comp, const bool &exp_most, const bool &rot_most, const amrex::Array4< const amrex::Real > &u, const amrex::Array4< const amrex::Real > &v, const amrex::Array4< const amrex::Real > &cell_data, const amrex::Array4< const amrex::Real > &cell_prim, const amrex::Array4< amrex::Real > &cell_rhs, const amrex::Array4< amrex::Real > &xflux, const amrex::Array4< amrex::Real > &yflux, const amrex::Array4< amrex::Real > &zflux, const amrex::Array4< const amrex::Real > &z_nd, const amrex::Array4< const amrex::Real > &ax, const amrex::Array4< const amrex::Real > &ay, const amrex::Array4< const amrex::Real > &az, const amrex::Array4< const amrex::Real > &detJ, const amrex::GpuArray< amrex::Real, AMREX_SPACEDIM > &dxInv, const amrex::Array4< const amrex::Real > &SmnSmn_a, const amrex::Array4< const amrex::Real > &mf_m, const amrex::Array4< const amrex::Real > &mf_u, const amrex::Array4< const amrex::Real > &mf_v, amrex::Array4< amrex::Real > &hfx_x, amrex::Array4< amrex::Real > &hfx_y, amrex::Array4< amrex::Real > &hfx_z, amrex::Array4< amrex::Real > &qfx1_x, amrex::Array4< amrex::Real > &qfx1_y, amrex::Array4< amrex::Real > &qfx1_z, amrex::Array4< amrex::Real > &qfx2_z, amrex::Array4< amrex::Real > &diss, const amrex::Array4< const amrex::Real > &mu_turb, const SolverChoice &solverChoice, const int level, const amrex::Array4< const amrex::Real > &tm_arr, const amrex::GpuArray< amrex::Real, AMREX_SPACEDIM > grav_gpu, const amrex::BCRec *bc_ptr, const bool use_most)
void EBAdvectionSrcForScalars(const amrex::Box &bx, const int icomp, const int ncomp, const amrex::Array4< const amrex::Real > &avg_xmom, const amrex::Array4< const amrex::Real > &avg_ymom, const amrex::Array4< const amrex::Real > &avg_zmom, const amrex::Array4< const amrex::Real > &cell_prim, const amrex::Array4< amrex::Real > &src, const amrex::Array4< const amrex::EBCellFlag > &cfg_arr, const amrex::Array4< const amrex::Real > &ax_arr, const amrex::Array4< const amrex::Real > &ay_arr, const amrex::Array4< const amrex::Real > &az_arr, const amrex::Array4< const amrex::Real > &vf_arr, const amrex::GpuArray< amrex::Real, AMREX_SPACEDIM > &cellSizeInv, const amrex::Array4< const amrex::Real > &mf_m, const AdvType horiz_adv_type, const AdvType vert_adv_type, const amrex::Real horiz_upw_frac, const amrex::Real vert_upw_frac, const amrex::GpuArray< const amrex::Array4< amrex::Real >, AMREX_SPACEDIM > &flx_arr, const amrex::Box &domain, const amrex::BCRec *bc_ptr_h)
#define RhoScalar_comp
Definition: ERF_IndexDefines.H:40
#define RhoTheta_comp
Definition: ERF_IndexDefines.H:37
#define RhoQ1_comp
Definition: ERF_IndexDefines.H:42
AdvType
Definition: ERF_IndexDefines.H:202
#define RhoKE_comp
Definition: ERF_IndexDefines.H:38
@ ymom
Definition: ERF_IndexDefines.H:152
@ cons
Definition: ERF_IndexDefines.H:150
@ zmom
Definition: ERF_IndexDefines.H:153
@ xmom
Definition: ERF_IndexDefines.H:151
@ xvel
Definition: ERF_IndexDefines.H:141
@ yvel
Definition: ERF_IndexDefines.H:142
Definition: ERF_AdvStruct.H:19
amrex::Real dryscal_vert_upw_frac
Definition: ERF_AdvStruct.H:292
AdvType moistscal_horiz_adv_type
Definition: ERF_AdvStruct.H:283
AdvType moistscal_vert_adv_type
Definition: ERF_AdvStruct.H:284
amrex::Real moistscal_vert_upw_frac
Definition: ERF_AdvStruct.H:294
bool use_efficient_advection
Definition: ERF_AdvStruct.H:278
amrex::Real moistscal_horiz_upw_frac
Definition: ERF_AdvStruct.H:293
AdvType dryscal_horiz_adv_type
Definition: ERF_AdvStruct.H:281
AdvType dryscal_vert_adv_type
Definition: ERF_AdvStruct.H:282
amrex::Real dryscal_horiz_upw_frac
Definition: ERF_AdvStruct.H:291
Definition: ERF_DiffStruct.H:19
MolecDiffType molec_diff_type
Definition: ERF_DiffStruct.H:81
bool use_explicit_most
Definition: ERF_DataStruct.H:692
static MeshType mesh_type
Definition: ERF_DataStruct.H:620
bool use_mono_adv
Definition: ERF_DataStruct.H:708
DiffChoice diffChoice
Definition: ERF_DataStruct.H:629
amrex::Real gravity
Definition: ERF_DataStruct.H:664
amrex::Vector< TurbChoice > turbChoice
Definition: ERF_DataStruct.H:631
amrex::Vector< int > anelastic
Definition: ERF_DataStruct.H:636
AdvChoice advChoice
Definition: ERF_DataStruct.H:628
MoistureType moisture_type
Definition: ERF_DataStruct.H:711
static TerrainType terrain_type
Definition: ERF_DataStruct.H:617
bool use_rotate_most
Definition: ERF_DataStruct.H:695
CouplingType coupling_type
Definition: ERF_DataStruct.H:710
Definition: ERF_TurbStruct.H:31
PBLType pbl_type
Definition: ERF_TurbStruct.H:238
bool use_KE
Definition: ERF_TurbStruct.H:252
RANSType rans_type
Definition: ERF_TurbStruct.H:235
LESType les_type
Definition: ERF_TurbStruct.H:202
bool advect_KE
Definition: ERF_TurbStruct.H:254