35 const Array4<Real >& tempold,
36 const Array4<Real >& tempcache,
37 const Array4<Real >& Hz,
38 const Array4<Real >& Huon,
39 const Array4<Real >& Hvom,
40 const Array4<Real >& W ,
41 const Array4<Real >& DC,
42 const Array4<Real >& FC ,
43 const Array4<Real >& tempstore,
44 const Array4<Real const>& z_w,
45 const Array4<Real const>& h,
46 const Array4<Real const>& pm,
47 const Array4<Real const>& pn,
48 const Array4<Real const>& msku,
49 const Array4<Real const>& mskv,
50 const Array4<int const>& river_pos,
51 const Array4<Real const>& river_source,
52 int iic,
int ntfirst,
int nrhs,
int N,
55 const Box& domain = geom[0].Domain();
56 const auto dlo = amrex::lbound(domain);
57 const auto dhi = amrex::ubound(domain);
59 GeometryData
const& geomdata = geom[0].data();
60 bool is_periodic_in_x = geomdata.isPeriodic(0);
61 bool is_periodic_in_y = geomdata.isPeriodic(1);
71 FArrayBox fab_FX(tbxp2,1,amrex::The_Async_Arena());
72 FArrayBox fab_FE(tbxp2,1,amrex::The_Async_Arena());
73 FArrayBox fab_curv(tbxp2,1,amrex::The_Async_Arena());
74 FArrayBox fab_grad(tbxp2,1,amrex::The_Async_Arena());
76 auto FX=fab_FX.array();
77 auto FE=fab_FE.array();
78 auto curv=fab_curv.array();
79 auto grad=fab_grad.array();
81 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
91 Box ubx = surroundingNodes(tbx,0);
92 Box vbx = surroundingNodes(tbx,1);
94 Box utbxp1 = surroundingNodes(tbxp1,0);
95 Box vtbxp1 = surroundingNodes(tbxp1,1);
97 Box gbx3uneven_init(IntVect(AMREX_D_DECL(tbx.smallEnd(0)-3,tbx.smallEnd(1)-3,tbx.smallEnd(2))),
98 IntVect(AMREX_D_DECL(tbx.bigEnd(0)+2,tbx.bigEnd(1)+2,tbx.bigEnd(2))));
99 BoxArray ba_gbx3uneven = intersect(BoxArray(gbx3uneven_init), gbx);
100 AMREX_ASSERT((ba_gbx3uneven.size() == 1));
101 Box gbx3uneven = ba_gbx3uneven[0];
104 BoxArray ba_gbx2 = intersect(BoxArray(gbx2), gbx);
105 AMREX_ASSERT((ba_gbx2.size() == 1));
109 BoxArray ba_gbx1 = intersect(BoxArray(gbx1), gbx);
110 AMREX_ASSERT((ba_gbx1.size() == 1));
118 Box gbx3unevenD = gbx3uneven;
119 gbx3unevenD.makeSlab(2,0);
124 [=] AMREX_GPU_DEVICE (
int i,
int j,
int )
133 for(
int k=1;k<=N+1;k++) {
134 W(i,j,k) = W(i,j,k-1) - (Huon(i+1,j,k-1)-Huon(i,j,k-1)) - (Hvom(i,j+1,k-1)-Hvom(i,j,k-1));
138 [=] AMREX_GPU_DEVICE (
int i,
int j,
int )
145 Real wrk_i=W(i,j,N+1)/(z_w(i,j,N+1)+h(i,j,0,0));
147 for (
int k=1; k<=N; k++) {
148 W(i,j,k) = W(i,j,k)- wrk_i*(z_w(i,j,k)+h(i,j,0,0));
155 FArrayBox fab_stflux(tbxp2,1,amrex::The_Async_Arena());
156 auto stflux= fab_stflux.array();
157 FArrayBox fab_btflux(tbxp2,1,amrex::The_Async_Arena());
158 auto btflux= fab_btflux.array();
164 ParallelFor(tbxp2, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
166 stflux(i,j,k)=0.0_rt;
167 btflux(i,j,k)=0.0_rt;
174 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
176 FX(i,j,k)=Box(tempold).contains(i-1,j,k) ? Huon(i,j,k)*
177 0.5_rt*(tempold(i-1,j,k)+tempold(i ,j,k)) : 1e34_rt;
179 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
181 FE(i,j,k)=Box(tempold).contains(i,j-1,k) ? Hvom(i,j,k)*
182 0.5_rt*(tempold(i,j-1,k)+tempold(i,j,k)) : 1e34_rt;
187 ParallelFor(utbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
190 FX(i,j,k)=(tempold(i,j,k,nrhs)-tempold(i-1,j,k,nrhs)) * msku(i,j,0);
193 Box utbxp1_slab_lo = makeSlab(utbxp1,0,dlo.x-1) & utbxp1;
194 Box utbxp1_slab_hi = makeSlab(utbxp1,0,dhi.x+1) & utbxp1;
195 if (utbxp1_slab_lo.ok() && !is_periodic_in_x) {
196 ParallelFor(utbxp1_slab_lo, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
198 FX(i,j,k) = FX(i+1,j,k);
201 if (utbxp1_slab_hi.ok() && !is_periodic_in_x) {
202 ParallelFor(utbxp1_slab_hi, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
204 FX(i+1,j,k) = FX(i,j,k);
208 ParallelFor(vtbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
211 FE(i,j,k)=(tempold(i,j,k,nrhs)-tempold(i,j-1,k,nrhs)) * mskv(i,j,0);
214 Box vtbxp1_slab_lo = makeSlab(vtbxp1,1,dlo.y-1) & vtbxp1;
215 Box vtbxp1_slab_hi = makeSlab(vtbxp1,1,dhi.y+1) & vtbxp1;
216 if (vtbxp1_slab_lo.ok() && !is_periodic_in_y) {
217 ParallelFor(vtbxp1_slab_lo, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
219 FE(i,j,k) = FE(i,j+1,k);
222 if (vtbxp1_slab_hi.ok() && !is_periodic_in_y) {
223 ParallelFor(vtbxp1_slab_hi, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
225 FE(i,j+1,k) = FE(i,j,k);
229 Real cffa=1.0_rt/6.0_rt;
230 Real cffb=1.0_rt/3.0_rt;
233 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
236 curv(i,j,k)=-FX(i,j,k)+FX(i+1,j,k);
239 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
241 Real max_Huon = std::max(Huon(i,j,k),0.0_rt);
242 Real min_Huon = std::min(Huon(i,j,k),0.0_rt);
244 FX(i,j,k)=Huon(i,j,k)*0.5_rt*(tempold(i,j,k)+tempold(i-1,j,k))-
245 cffa*(curv(i,j,k)*min_Huon+ curv(i-1,j,k)*max_Huon);
250 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
253 grad(i,j,k)=0.5_rt*(FX(i,j,k)+FX(i+1,j,k));
256 ParallelFor(ubx, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
258 FX(i,j,k)=Huon(i,j,k)*0.5_rt*(tempold(i,j,k)+tempold(i-1,j,k)-
259 cffb*(grad(i,j,k)-grad(i-1,j,k)));
262 Error(
"Not a valid horizontal advection scheme");
267 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
269 curv(i,j,k)=-FE(i,j,k)+FE(i,j+1,k);
272 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
274 Real max_Hvom = std::max(Hvom(i,j,k),0.0_rt);
275 Real min_Hvom = std::min(Hvom(i,j,k),0.0_rt);
277 FE(i,j,k)=Hvom(i,j,k)*0.5_rt*(tempold(i,j,k)+tempold(i,j-1,k))-
278 cffa*(curv(i,j,k)*min_Hvom+ curv(i,j-1,k)*max_Hvom);
283 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
285 grad(i,j,k)=0.5_rt*(FE(i,j,k)+FE(i,j+1,k));
288 ParallelFor(vbx, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
290 FE(i,j,k)=Hvom(i,j,k)*0.5_rt*(tempold(i,j,k)+tempold(i,j-1,k)-
291 cffb*(grad(i,j,k)- grad(i,j-1,k)));
294 Error(
"Not a valid horizontal advection scheme");
298 bool do_rivers_cons = (river_source.size() > 0);
301 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
303 int iriver = river_pos(i,j,0);
305 if (river_direction_d[iriver] == 0) {
306 FX(i,j,k) = (!do_rivers_cons) ? 0.0_rt : Huon(i,j,k) * river_source(iriver,0,k);
308 FE(i,j,k) = (!do_rivers_cons) ? 0.0_rt : Hvom(i,j,k) * river_source(iriver,0,k);
319 Real cff1 = 0.0_rt, cff2 = 0.0_rt, cff;
321 Real GammaT = 1.0_rt/6.0_rt;
329 cff=(1.0_rt-GammaT)*dt_lev;
334 ParallelFor(tbx, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
336 tempstore(i,j,k)=Hz(i,j,k)*( cff1 * tempold(i,j,k)+
337 cff2 * tempcache(i,j,k) )-
338 cff * pm(i,j,0)*pn(i,j,0) * (FX(i+1,j,k)-FX(i,j,k)+
339 FE(i,j+1,k)-FE(i,j,k));
346 ParallelFor(convert(tbx,IntVect(0,0,1)), [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
353 Real c2=7.0_rt/12.0_rt;
354 Real c3=1.0_rt/12.0_rt;
358 FC(i,j,k)=( c2*(tempold(i ,j,k-1,nrhs)+ tempold(i,j,k ,nrhs))
359 -c3*(tempold(i ,j,k-2 ,nrhs)+ tempold(i,j,k+1,nrhs)) )*
366 FC(i,j,N) = ( c2*tempold(i,j,N-1,nrhs)+ c1*tempold(i,j,N,nrhs)-c3*tempold(i,j,N-2,nrhs) )
369 FC(i,j, 1) = ( c2*tempold(i,j, 1,nrhs)+ c1*tempold(i,j,0,nrhs)-c3*tempold(i,j,2,nrhs) )
376 ParallelFor(tbxp1, [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
379 DC(i,j,k)=1.0_rt/(Hz(i,j,k)-
380 cff*pm(i,j,0)*pn(i,j,0)*
381 (Huon(i+1,j,k)-Huon(i,j,k)+
382 Hvom(i,j+1,k)-Hvom(i,j,k)+
383 (W(i,j,k+1)-W(i,j,k))));
394 [=] AMREX_GPU_DEVICE (
int i,
int j,
int k)
396 Real c1 = cff*pm(i,j,0)*pn(i,j,0);
398 Real c4 = FC(i,j,k+1)-FC(i,j,k);
400 tempstore(i,j,k) = DC(i,j,k)*(tempstore(i,j,k)-c1*c4);