2 files changed, 268 insertions, 255 deletions
diff --git a/Source/Particles/Deposition/CurrentDeposition.H b/Source/Particles/Deposition/CurrentDeposition.H
index 58621c76b..df6481fd8 100644
--- a/Source/Particles/Deposition/CurrentDeposition.H
+++ b/Source/Particles/Deposition/CurrentDeposition.H
@@ -54,133 +54,86 @@ void doDepositionShapeN(const amrex::Real * const xp,
     const amrex::Real clightsq = 1.0/PhysConst::c/PhysConst::c;
 
     // Loop over particles and deposit into jx_arr, jy_arr and jz_arr
-    ParallelFor( np_to_depose,
-                 [=] AMREX_GPU_DEVICE (long ip) {
-                     // --- Get particle quantities
-                     const amrex::Real gaminv = 1.0/std::sqrt(1.0 + uxp[ip]*uxp[ip]*clightsq
-                                                       + uyp[ip]*uyp[ip]*clightsq
-                                                       + uzp[ip]*uzp[ip]*clightsq);
-                     const amrex::Real wq  = q*wp[ip];
-                     const amrex::Real vx  = uxp[ip]*gaminv;
-                     const amrex::Real vy  = uyp[ip]*gaminv;
-                     const amrex::Real vz  = uzp[ip]*gaminv;
-                     // wqx, wqy wqz are particle current in each direction 
-                     const amrex::Real wqx = wq*invvol*vx;
-                     const amrex::Real wqy = wq*invvol*vy;
-                     const amrex::Real wqz = wq*invvol*vz;
+    amrex::ParallelFor(
+        np_to_depose,
+        [=] AMREX_GPU_DEVICE (long ip) {
+            // --- Get particle quantities
+            const amrex::Real gaminv = 1.0/std::sqrt(1.0 + uxp[ip]*uxp[ip]*clightsq
+                                                     + uyp[ip]*uyp[ip]*clightsq
+                                                     + uzp[ip]*uzp[ip]*clightsq);
+            const amrex::Real wq  = q*wp[ip];
+            const amrex::Real vx  = uxp[ip]*gaminv;
+            const amrex::Real vy  = uyp[ip]*gaminv;
+            const amrex::Real vz  = uzp[ip]*gaminv;
+            // wqx, wqy wqz are particle current in each direction 
+            const amrex::Real wqx = wq*invvol*vx;
+            const amrex::Real wqy = wq*invvol*vy;
+            const amrex::Real wqz = wq*invvol*vz;
 
-                     // --- Compute shape factors
-                     // x direction
-                     // Get particle position after 1/2 push back in position
-                     const amrex::Real xmid = (xp[ip]-xmin)*dxi-dts2dx*vx;
-                     // Compute shape factors for node-centered quantities
-                     amrex::Real AMREX_RESTRICT sx [depos_order + 1];
-                     // j: leftmost grid point (node-centered) that the particle touches
-                     const int j  = compute_shape_factor<depos_order>(sx,  xmid);
-                     // Compute shape factors for cell-centered quantities
-                     amrex::Real AMREX_RESTRICT sx0[depos_order + 1];
-                     // j0: leftmost grid point (cell-centered) that the particle touches
-                     const int j0 = compute_shape_factor<depos_order>(sx0, xmid-stagger_shift);
+            // --- Compute shape factors
+            // x direction
+            // Get particle position after 1/2 push back in position
+            const amrex::Real xmid = (xp[ip]-xmin)*dxi-dts2dx*vx;
+            // Compute shape factors for node-centered quantities
+            amrex::Real AMREX_RESTRICT sx [depos_order + 1];
+            // j: leftmost grid point (node-centered) that the particle touches
+            const int j  = compute_shape_factor<depos_order>(sx,  xmid);
+            // Compute shape factors for cell-centered quantities
+            amrex::Real AMREX_RESTRICT sx0[depos_order + 1];
+            // j0: leftmost grid point (cell-centered) that the particle touches
+            const int j0 = compute_shape_factor<depos_order>(sx0, xmid-stagger_shift);
                      
 #if (AMREX_SPACEDIM == 3)
-                     // y direction
-                     const amrex::Real ymid= (yp[ip]-ymin)*dyi-dts2dy*vy;
-                     amrex::Real AMREX_RESTRICT sy [depos_order + 1];
-                     const int k  = compute_shape_factor<depos_order>(sy,  ymid);
-                     amrex::Real AMREX_RESTRICT sy0[depos_order + 1];
-                     const int k0 = compute_shape_factor<depos_order>(sy0, ymid-stagger_shift);
+            // y direction
+            const amrex::Real ymid= (yp[ip]-ymin)*dyi-dts2dy*vy;
+            amrex::Real AMREX_RESTRICT sy [depos_order + 1];
+            const int k  = compute_shape_factor<depos_order>(sy,  ymid);
+            amrex::Real AMREX_RESTRICT sy0[depos_order + 1];
+            const int k0 = compute_shape_factor<depos_order>(sy0, ymid-stagger_shift);
 #endif
-                     // z direction
-                     const amrex::Real zmid= (zp[ip]-zmin)*dzi-dts2dz*vz;
-                     amrex::Real AMREX_RESTRICT sz [depos_order + 1];
-                     const int l  = compute_shape_factor<depos_order>(sz,  zmid);
-                     amrex::Real AMREX_RESTRICT sz0[depos_order + 1];
-                     const int l0 = compute_shape_factor<depos_order>(sz0, zmid-stagger_shift);
+            // z direction
+            const amrex::Real zmid= (zp[ip]-zmin)*dzi-dts2dz*vz;
+            amrex::Real AMREX_RESTRICT sz [depos_order + 1];
+            const int l  = compute_shape_factor<depos_order>(sz,  zmid);
+            amrex::Real AMREX_RESTRICT sz0[depos_order + 1];
+            const int l0 = compute_shape_factor<depos_order>(sz0, zmid-stagger_shift);
 
-                     // Deposit current into jx_arr, jy_arr and jz_arr
+            // Deposit current into jx_arr, jy_arr and jz_arr
 #if (AMREX_SPACEDIM == 2)
-                     for (int iz=0; iz<=depos_order; iz++){
-                         for (int ix=0; ix<=depos_order; ix++){
-                             amrex::Gpu::Atomic::Add(
-                                 &jx_arr(lo.x+j0+ix, lo.y+l +iz, 0), 
-                                 sx0[ix]*sz [iz]*wqx);
-                             amrex::Gpu::Atomic::Add(
-                                 &jy_arr(lo.x+j +ix, lo.y+l +iz, 0), 
-                                 sx [ix]*sz [iz]*wqy);
-                             amrex::Gpu::Atomic::Add(
-                                 &jz_arr(lo.x+j +ix, lo.y+l0+iz, 0), 
-                                 sx [ix]*sz0[iz]*wqz);
-                         }
-                     }
+            for (int iz=0; iz<=depos_order; iz++){
+                for (int ix=0; ix<=depos_order; ix++){
+                    amrex::Gpu::Atomic::Add(
+                        &jx_arr(lo.x+j0+ix, lo.y+l +iz, 0), 
+                        sx0[ix]*sz [iz]*wqx);
+                    amrex::Gpu::Atomic::Add(
+                        &jy_arr(lo.x+j +ix, lo.y+l +iz, 0), 
+                        sx [ix]*sz [iz]*wqy);
+                    amrex::Gpu::Atomic::Add(
+                        &jz_arr(lo.x+j +ix, lo.y+l0+iz, 0), 
+                        sx [ix]*sz0[iz]*wqz);
+                }
+            }
 #else // (AMREX_SPACEDIM == 3)
-                     for (int iz=0; iz<=depos_order; iz++){
-                         for (int iy=0; iy<=depos_order; iy++){
-                             for (int ix=0; ix<=depos_order; ix++){
-                                 amrex::Gpu::Atomic::Add(
-                                     &jx_arr(lo.x+j0+ix, lo.y+k +iy, lo.z+l +iz),
-                                     sx0[ix]*sy [iy]*sz [iz]*wqx);
-                                 amrex::Gpu::Atomic::Add(
-                                     &jy_arr(lo.x+j +ix, lo.y+k0+iy, lo.z+l +iz), 
-                                     sx [ix]*sy0[iy]*sz [iz]*wqy);
-                                 amrex::Gpu::Atomic::Add(
-                                     &jz_arr(lo.x+j +ix, lo.y+k +iy, lo.z+l0+iz),
-                                     sx [ix]*sy [iy]*sz0[iz]*wqz);
-                             }
-                         }
-                     }
+            for (int iz=0; iz<=depos_order; iz++){
+                for (int iy=0; iy<=depos_order; iy++){
+                    for (int ix=0; ix<=depos_order; ix++){
+                        amrex::Gpu::Atomic::Add(
+                            &jx_arr(lo.x+j0+ix, lo.y+k +iy, lo.z+l +iz),
+                            sx0[ix]*sy [iy]*sz [iz]*wqx);
+                        amrex::Gpu::Atomic::Add(
+                            &jy_arr(lo.x+j +ix, lo.y+k0+iy, lo.z+l +iz), 
+                            sx [ix]*sy0[iy]*sz [iz]*wqy);
+                        amrex::Gpu::Atomic::Add(
+                            &jz_arr(lo.x+j +ix, lo.y+k +iy, lo.z+l0+iz),
+                            sx [ix]*sy [iy]*sz0[iz]*wqz);
+                    }
+                }
+            }
 #endif
-                 }
+        }
         );
 }
 
-// Compute shape factor and return index of leftmost cell where
-// particle writes.
-// Specialized templates are defined below for orders 1, 2 and 3.
-template <int depos_order>
-AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
-int compute_shifted_shape_factor (Real* const sx, const Real x_old, const int i_new);
-
-// Compute shape factor for order 1.
-template <>
-AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
-int compute_shifted_shape_factor <1> (Real* const sx, const Real x_old, const int i_new){
-    const int i = (int) x_old;
-    const int i_shift = i - i_new;
-    const Real xint = x_old - i;
-    sx[1+i_shift] = 1.0 - xint;
-    sx[2+i_shift] = xint;
-    return i;
-}
-
-// Compute shape factor for order 2.
-template <>
-AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
-int compute_shifted_shape_factor <2> (Real* const sx, const Real x_old, const int i_new){
-    const int i = (int) (x_old+0.5);
-    const int i_shift = i - (i_new + 1);
-    const Real xint = x_old - i;
-    sx[1+i_shift] = 0.5*(0.5-xint)*(0.5-xint);
-    sx[2+i_shift] = 0.75-xint*xint;
-    sx[3+i_shift] = 0.5*(0.5+xint)*(0.5+xint);
-    // index of the leftmost cell where particle deposits
-    return i-1;
-}
-
-// Compute shape factor for order 3.
-template <>
-AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
-int compute_shifted_shape_factor <3> (Real* const sx, const Real x_old, const int i_new){
-    const int i = (int) x_old;
-    const int i_shift = i - (i_new + 1);
-    const Real xint = x_old - i;
-    sx[1+i_shift] = 1.0/6.0*(1.0-xint)*(1.0-xint)*(1.0-xint);
-    sx[2+i_shift] = 2.0/3.0-xint*xint*(1-xint/2.0);
-    sx[3+i_shift] = 2.0/3.0-(1-xint)*(1-xint)*(1.0-0.5*(1-xint));
-    sx[4+i_shift] = 1.0/6.0*xint*xint*xint;
-    // index of the leftmost cell where particle deposits
-    return i-1;
-}
-
 /* \brief Esirkepov Current Deposition for thread thread_num
  * /param xp, yp, zp   : Pointer to arrays of particle positions.
  * \param wp           : Pointer to array of particle weights.
@@ -196,170 +149,173 @@ int compute_shifted_shape_factor <3> (Real* const sx, const Real x_old, const in
  * /param q            : species charge.
  */
 template <int depos_order>
-void doEsirkepovDepositionShapeN (const Real * const xp, const Real * const yp, const Real * const zp,
-                                  const Real * const wp, const Real * const uxp,
-                                  const Real * const uyp, const Real * const uzp,
+void doEsirkepovDepositionShapeN (const amrex::Real * const xp,
+                                  const amrex::Real * const yp,
+                                  const amrex::Real * const zp,
+                                  const amrex::Real * const wp,
+                                  const amrex::Real * const uxp,
+                                  const amrex::Real * const uyp,
+                                  const amrex::Real * const uzp,
                                   const amrex::Array4<amrex::Real>& Jx_arr,
                                   const amrex::Array4<amrex::Real>& Jy_arr,
                                   const amrex::Array4<amrex::Real>& Jz_arr,
                                   const long np_to_depose,
-                                  const amrex::Real dt, const std::array<amrex::Real,3>& dx,
-                                  const std::array<Real, 3> xyzmin,
-                                  const Dim3 lo,
+                                  const amrex::Real dt,
+                                  const std::array<amrex::Real,3>& dx,
+                                  const std::array<amrex::Real, 3> xyzmin,
+                                  const amrex::Dim3 lo,
                                   const amrex::Real q)
 {
-    const Real dxi = 1.0/dx[0];
-    const Real dtsdx0 = dt*dxi;
-    const Real xmin = xyzmin[0];
+    const amrex::Real dxi = 1.0/dx[0];
+    const amrex::Real dtsdx0 = dt*dxi;
+    const amrex::Real xmin = xyzmin[0];
 #if (AMREX_SPACEDIM == 3)
-    const Real dyi = 1.0/dx[1];
-    const Real dtsdy0 = dt*dyi;
-    const Real ymin = xyzmin[1];
+    const amrex::Real dyi = 1.0/dx[1];
+    const amrex::Real dtsdy0 = dt*dyi;
+    const amrex::Real ymin = xyzmin[1];
 #endif
-    const Real dzi = 1.0/dx[2];
-    const Real dtsdz0 = dt*dzi;
-    const Real zmin = xyzmin[2];
+    const amrex::Real dzi = 1.0/dx[2];
+    const amrex::Real dtsdz0 = dt*dzi;
+    const amrex::Real zmin = xyzmin[2];
 
 #if (AMREX_SPACEDIM == 3)
-    const Real invdtdx = 1.0/(dt*dx[1]*dx[2]);
-    const Real invdtdy = 1.0/(dt*dx[0]*dx[2]);
-    const Real invdtdz = 1.0/(dt*dx[0]*dx[1]);
+    const amrex::Real invdtdx = 1.0/(dt*dx[1]*dx[2]);
+    const amrex::Real invdtdy = 1.0/(dt*dx[0]*dx[2]);
+    const amrex::Real invdtdz = 1.0/(dt*dx[0]*dx[1]);
 #elif (AMREX_SPACEDIM == 2)
-    const Real invdtdx = 1.0/(dt*dx[2]);
-    const Real invdtdz = 1.0/(dt*dx[0]);
-    const Real invvol = 1.0/(dx[0]*dx[2]);
+    const amrex::Real invdtdx = 1.0/(dt*dx[2]);
+    const amrex::Real invdtdz = 1.0/(dt*dx[0]);
+    const amrex::Real invvol = 1.0/(dx[0]*dx[2]);
 #endif
 
-    const Real clightsq = 1.0/PhysConst::c/PhysConst::c;
+    const amrex::Real clightsq = 1.0/PhysConst::c/PhysConst::c;
 
     // Loop over particles and deposit into Jx_arr, Jy_arr and Jz_arr
-    ParallelFor( np_to_depose,
-                 [=] AMREX_GPU_DEVICE (long ip) {
+    ParallelFor( 
+        np_to_depose,
+        [=] AMREX_GPU_DEVICE (long ip) {
 
-                     // --- Get particle quantities
-                     const Real gaminv = 1.0/std::sqrt(1.0 + uxp[ip]*uxp[ip]*clightsq
-                                                           + uyp[ip]*uyp[ip]*clightsq
-                                                           + uzp[ip]*uzp[ip]*clightsq);
+            // --- Get particle quantities
+            const amrex::Real gaminv = 1.0/std::sqrt(1.0 + uxp[ip]*uxp[ip]*clightsq
+                                                     + uyp[ip]*uyp[ip]*clightsq
+                                                     + uzp[ip]*uzp[ip]*clightsq);
 
-                     // wqx, wqy wqz are particle current in each direction
-                     const Real wq = q*wp[ip];
-                     const Real wqx = wq*invdtdx;
+            // wqx, wqy wqz are particle current in each direction
+            const amrex::Real wq = q*wp[ip];
+            const amrex::Real wqx = wq*invdtdx;
 #if (AMREX_SPACEDIM == 3)
-                     const Real wqy = wq*invdtdy;
+            const amrex::Real wqy = wq*invdtdy;
 #endif
-                     const Real wqz = wq*invdtdz;
+            const amrex::Real wqz = wq*invdtdz;
 
-                     // computes current and old position in grid units
-                     const Real x_new = (xp[ip] - xmin)*dxi;
-                     const Real x_old = x_new - dtsdx0*uxp[ip]*gaminv;
+            // computes current and old position in grid units
+            const amrex::Real x_new = (xp[ip] - xmin)*dxi;
+            const amrex::Real x_old = x_new - dtsdx0*uxp[ip]*gaminv;
 #if (AMREX_SPACEDIM == 3)        
-                     const Real y_new = (yp[ip] - ymin)*dyi;
-                     const Real y_old = y_new - dtsdy0*uyp[ip]*gaminv;
+            const amrex::Real y_new = (yp[ip] - ymin)*dyi;
+            const amrex::Real y_old = y_new - dtsdy0*uyp[ip]*gaminv;
 #endif
-                     const Real z_new = (zp[ip] - zmin)*dzi;
-                     const Real z_old = z_new - dtsdz0*uzp[ip]*gaminv;
+            const amrex::Real z_new = (zp[ip] - zmin)*dzi;
+            const amrex::Real z_old = z_new - dtsdz0*uzp[ip]*gaminv;
 
-                     // Shape factor arrays
-                     // Note that there are extra values above and below
-                     // to possibly hold the factor for the old particle
-                     // which can be at a different grid location.
-                     Real AMREX_RESTRICT sx_new[depos_order + 3] = {0.};
-                     Real AMREX_RESTRICT sx_old[depos_order + 3] = {0.};
+            // Shape factor arrays
+            // Note that there are extra values above and below
+            // to possibly hold the factor for the old particle
+            // which can be at a different grid location.
+            amrex::Real AMREX_RESTRICT sx_new[depos_order + 3] = {0.};
+            amrex::Real AMREX_RESTRICT sx_old[depos_order + 3] = {0.};
 #if (AMREX_SPACEDIM == 3)
-                     Real AMREX_RESTRICT sy_new[depos_order + 3] = {0.};
-                     Real AMREX_RESTRICT sy_old[depos_order + 3] = {0.};
+            amrex::Real AMREX_RESTRICT sy_new[depos_order + 3] = {0.};
+            amrex::Real AMREX_RESTRICT sy_old[depos_order + 3] = {0.};
 #endif
-                     Real AMREX_RESTRICT sz_new[depos_order + 3] = {0.};
-                     Real AMREX_RESTRICT sz_old[depos_order + 3] = {0.};
+            amrex::Real AMREX_RESTRICT sz_new[depos_order + 3] = {0.};
+            amrex::Real AMREX_RESTRICT sz_old[depos_order + 3] = {0.};
 
-                     // --- Compute shape factors
-                     // Compute shape factors for position as they are now and at old positions
-                     // [ijk]_new: leftmost grid point that the particle touches
-                     const int i_new = compute_shape_factor<depos_order>(sx_new+1, x_new);
-                     const int i_old = compute_shifted_shape_factor<depos_order>(sx_old, x_old, i_new);
+            // --- Compute shape factors
+            // Compute shape factors for position as they are now and at old positions
+            // [ijk]_new: leftmost grid point that the particle touches
+            const int i_new = compute_shape_factor<depos_order>(sx_new+1, x_new);
+            const int i_old = compute_shifted_shape_factor<depos_order>(sx_old, x_old, i_new);
 #if (AMREX_SPACEDIM == 3)
-                     const int j_new = compute_shape_factor<depos_order>(sy_new+1, y_new);
-                     const int j_old = compute_shifted_shape_factor<depos_order>(sy_old, y_old, j_new);
+            const int j_new = compute_shape_factor<depos_order>(sy_new+1, y_new);
+            const int j_old = compute_shifted_shape_factor<depos_order>(sy_old, y_old, j_new);
 #endif 
-                     const int k_new = compute_shape_factor<depos_order>(sz_new+1, z_new);
-                     const int k_old = compute_shifted_shape_factor<depos_order>(sz_old, z_old, k_new);
+            const int k_new = compute_shape_factor<depos_order>(sz_new+1, z_new);
+            const int k_old = compute_shifted_shape_factor<depos_order>(sz_old, z_old, k_new);
 
-                     // computes min/max positions of current contributions
-                     int dil = 1, diu = 1;
-                     if (i_old < i_new) dil = 0;
-                     if (i_old > i_new) diu = 0;
+            // computes min/max positions of current contributions
+            int dil = 1, diu = 1;
+            if (i_old < i_new) dil = 0;
+            if (i_old > i_new) diu = 0;
 #if (AMREX_SPACEDIM == 3)
-                     int djl = 1, dju = 1;
-                     if (j_old < j_new) djl = 0;
-                     if (j_old > j_new) dju = 0;
+            int djl = 1, dju = 1;
+            if (j_old < j_new) djl = 0;
+            if (j_old > j_new) dju = 0;
 #endif
-                     int dkl = 1, dku = 1;
-                     if (k_old < k_new) dkl = 0;
-                     if (k_old > k_new) dku = 0;
+            int dkl = 1, dku = 1;
+            if (k_old < k_new) dkl = 0;
+            if (k_old > k_new) dku = 0;
 
 #if (AMREX_SPACEDIM == 3)
 
-                     for (int k=dkl; k<=depos_order+2-dku; k++) {
-                         for (int j=djl; j<=depos_order+2-dju; j++) {
-                             Real sdxi = 0.;
-                             for (int i=dil; i<=depos_order+1-diu; i++) {
-                                 sdxi += wqx*(sx_old[i] - sx_new[i])*((sy_new[j] + 0.5*(sy_old[j] - sy_new[j]))*sz_new[k] +
-                                         (0.5*sy_new[j] + 1./3.*(sy_old[j] - sy_new[j]))*(sz_old[k] - sz_new[k]));
-                                 amrex::Gpu::Atomic::Add( &Jx_arr(lo.x+i_new-1+i, lo.y+j_new-1+j, lo.z+k_new-1+k), sdxi);
-                             }
-                         }
-                     }
-                     for (int k=dkl; k<=depos_order+2-dku; k++) {
-                         for (int i=dil; i<=depos_order+2-diu; i++) {
-                             Real sdyj = 0.;
-                             for (int j=djl; j<=depos_order+1-dju; j++) {
-                                 sdyj += wqy*(sy_old[j] - sy_new[j])*((sz_new[k] + 0.5*(sz_old[k] - sz_new[k]))*sx_new[i] +
-                                         (0.5*sz_new[k] + 1./3.*(sz_old[k] - sz_new[k]))*(sx_old[i] - sx_new[i]));
-                                 amrex::Gpu::Atomic::Add( &Jy_arr(lo.x+i_new-1+i, lo.y+j_new-1+j, lo.z+k_new-1+k), sdyj);
-                             }
-                         }
-                     }
-                     for (int j=djl; j<=depos_order+2-dju; j++) {
-                         for (int i=dil; i<=depos_order+2-diu; i++) {
-                             Real sdzk = 0.;
-                             for (int k=dkl; k<=depos_order+1-dku; k++) {
-                                 sdzk += wqz*(sz_old[k] - sz_new[k])*((sx_new[i] + 0.5*(sx_old[i] - sx_new[i]))*sy_new[j] +
-                                         (0.5*sx_new[i] + 1./3.*(sx_old[i] - sx_new[i]))*(sy_old[j] - sy_new[j]));
-                                 amrex::Gpu::Atomic::Add( &Jz_arr(lo.x+i_new-1+i, lo.y+j_new-1+j, lo.z+k_new-1+k), sdzk);
-                             }
-                         }
-                     }
-
-#elif (AMREX_SPACEDIM == 2)
-
-                    for (int k=dkl; k<=depos_order+2-dku; k++) {
-                        Real sdxi = 0.;
-                        for (int i=dil; i<=depos_order+1-diu; i++) {
-                            sdxi += wqx*(sx_old[i] - sx_new[i])*(sz_new[k] + 0.5*(sz_old[k] - sz_new[k]));
-                            amrex::Gpu::Atomic::Add( &Jx_arr(lo.x+i_new-1+i, lo.y+k_new-1+k, 0), sdxi);
-                        }
+            for (int k=dkl; k<=depos_order+2-dku; k++) {
+                for (int j=djl; j<=depos_order+2-dju; j++) {
+                    amrex::Real sdxi = 0.;
+                    for (int i=dil; i<=depos_order+1-diu; i++) {
+                        sdxi += wqx*(sx_old[i] - sx_new[i])*((sy_new[j] + 0.5*(sy_old[j] - sy_new[j]))*sz_new[k] +
+                                                             (0.5*sy_new[j] + 1./3.*(sy_old[j] - sy_new[j]))*(sz_old[k] - sz_new[k]));
+                        amrex::Gpu::Atomic::Add( &Jx_arr(lo.x+i_new-1+i, lo.y+j_new-1+j, lo.z+k_new-1+k), sdxi);
                     }
-                    for (int k=dkl; k<=depos_order+2-dku; k++) {
-                        for (int i=dil; i<=depos_order+2-diu; i++) {
-                            const Real sdyj = wq*uyp[ip]*gaminv*invvol*((sz_new[k] + 0.5*(sz_old[k] - sz_new[k]))*sx_new[i] +
-                                        (0.5*sz_new[k] + 1./3.*(sz_old[k] - sz_new[k]))*(sx_old[i] - sx_new[i]));
-                            amrex::Gpu::Atomic::Add( &Jy_arr(lo.x+i_new-1+i, lo.y+k_new-1+k, 0), sdyj);
-                        }
+                }
+            }
+            for (int k=dkl; k<=depos_order+2-dku; k++) {
+                for (int i=dil; i<=depos_order+2-diu; i++) {
+                    amrex::Real sdyj = 0.;
+                    for (int j=djl; j<=depos_order+1-dju; j++) {
+                        sdyj += wqy*(sy_old[j] - sy_new[j])*((sz_new[k] + 0.5*(sz_old[k] - sz_new[k]))*sx_new[i] +
+                                                             (0.5*sz_new[k] + 1./3.*(sz_old[k] - sz_new[k]))*(sx_old[i] - sx_new[i]));
+                        amrex::Gpu::Atomic::Add( &Jy_arr(lo.x+i_new-1+i, lo.y+j_new-1+j, lo.z+k_new-1+k), sdyj);
                     }
-                    for (int i=dil; i<=depos_order+2-diu; i++) {
-                        Real sdzk = 0.;
-                        for (int k=dkl; k<=depos_order+1-dku; k++) {
-                            sdzk += wqz*(sz_old[k] - sz_new[k])*(sx_new[i] + 0.5*(sx_old[i] - sx_new[i]));
-                            amrex::Gpu::Atomic::Add( &Jz_arr(lo.x+i_new-1+i, lo.y+k_new-1+k, 0), sdzk);
-                        }
+                }
+            }
+            for (int j=djl; j<=depos_order+2-dju; j++) {
+                for (int i=dil; i<=depos_order+2-diu; i++) {
+                    amrex::Real sdzk = 0.;
+                    for (int k=dkl; k<=depos_order+1-dku; k++) {
+                        sdzk += wqz*(sz_old[k] - sz_new[k])*((sx_new[i] + 0.5*(sx_old[i] - sx_new[i]))*sy_new[j] +
+                                                             (0.5*sx_new[i] + 1./3.*(sx_old[i] - sx_new[i]))*(sy_old[j] - sy_new[j]));
+                        amrex::Gpu::Atomic::Add( &Jz_arr(lo.x+i_new-1+i, lo.y+j_new-1+j, lo.z+k_new-1+k), sdzk);
                     }
+                }
+            }
 
-#endif
-                 }
-        );
-
+#elif (AMREX_SPACEDIM == 2)
 
+            for (int k=dkl; k<=depos_order+2-dku; k++) {
+                amrex::Real sdxi = 0.;
+                for (int i=dil; i<=depos_order+1-diu; i++) {
+                    sdxi += wqx*(sx_old[i] - sx_new[i])*(sz_new[k] + 0.5*(sz_old[k] - sz_new[k]));
+                    amrex::Gpu::Atomic::Add( &Jx_arr(lo.x+i_new-1+i, lo.y+k_new-1+k, 0), sdxi);
+                }
+            }
+            for (int k=dkl; k<=depos_order+2-dku; k++) {
+                for (int i=dil; i<=depos_order+2-diu; i++) {
+                    const amrex::Real sdyj = wq*uyp[ip]*gaminv*invvol*((sz_new[k] + 0.5*(sz_old[k] - sz_new[k]))*sx_new[i] +
+                                                                       (0.5*sz_new[k] + 1./3.*(sz_old[k] - sz_new[k]))*(sx_old[i] - sx_new[i]));
+                    amrex::Gpu::Atomic::Add( &Jy_arr(lo.x+i_new-1+i, lo.y+k_new-1+k, 0), sdyj);
+                }
+            }
+            for (int i=dil; i<=depos_order+2-diu; i++) {
+                amrex::Real sdzk = 0.;
+                for (int k=dkl; k<=depos_order+1-dku; k++) {
+                    sdzk += wqz*(sz_old[k] - sz_new[k])*(sx_new[i] + 0.5*(sx_old[i] - sx_new[i]));
+                    amrex::Gpu::Atomic::Add( &Jz_arr(lo.x+i_new-1+i, lo.y+k_new-1+k, 0), sdzk);
+                }
+            }
 
+#endif
+        }
+        );
 }
 
 #endif // CURRENTDEPOSITION_H_
diff --git a/Source/Particles/ShapeFactors.H b/Source/Particles/ShapeFactors.H
index 6258f05af..9d185714a 100644
--- a/Source/Particles/ShapeFactors.H
+++ b/Source/Particles/ShapeFactors.H
@@ -1,20 +1,21 @@
 #ifndef SHAPEFACTORS_H_
 #define SHAPEFACTORS_H_
 
-using namespace amrex;
-
 // Compute shape factor and return index of leftmost cell where 
 // particle writes.
-// Specialized templates are defined below for orders 1, 2 and 3.
+// Specialized templates are defined below for orders 0 to 3.
 template <int depos_order>
 AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
-int compute_shape_factor(Real* const sx, Real xint) {return 0;};
+int compute_shape_factor(amrex::Real* const sx, amrex::Real xint)
+{
+    return 0;
+};
 
 // Compute shape factor for order 0.
 template <>
 AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
-int compute_shape_factor <0> (Real* const sx, Real xmid){
-    int j = (int) (xmid+0.5);
+int compute_shape_factor <0> (amrex::Real* const sx, amrex::Real xmid){
+    const int j = (int) (xmid+0.5);
     sx[0] = 1.0;
     return j;
 }
@@ -22,9 +23,9 @@ int compute_shape_factor <0> (Real* const sx, Real xmid){
 // Compute shape factor for order 1.
 template <>
 AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
-int compute_shape_factor <1> (Real* const sx, Real xmid){
-    int j = (int) xmid;
-    Real xint = xmid-j;
+int compute_shape_factor <1> (amrex::Real* const sx, amrex::Real xmid){
+    const int j = (int) xmid;
+    const amrex::Real xint = xmid-j;
     sx[0] = 1.0 - xint;
     sx[1] = xint;
     return j;
@@ -33,9 +34,9 @@ int compute_shape_factor <1> (Real* const sx, Real xmid){
 // Compute shape factor for order 2.
 template <>
 AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
-int compute_shape_factor <2> (Real* const sx, Real xmid){
-    int j = (int) (xmid+0.5);
-    Real xint = xmid-j;
+int compute_shape_factor <2> (amrex::Real* const sx, amrex::Real xmid){
+    const int j = (int) (xmid+0.5);
+    const amrex::Real xint = xmid-j;
     sx[0] = 0.5*(0.5-xint)*(0.5-xint);
     sx[1] = 0.75-xint*xint;
     sx[2] = 0.5*(0.5+xint)*(0.5+xint);
@@ -46,9 +47,9 @@ int compute_shape_factor <2> (Real* const sx, Real xmid){
 // Compute shape factor for order 3.
 template <>
 AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
-int compute_shape_factor <3> (Real* const sx, Real xmid){
-    int j = (int) xmid;
-    Real xint = xmid-j;
+int compute_shape_factor <3> (amrex::Real* const sx, amrex::Real xmid){
+    const int j = (int) xmid;
+    const amrex::Real xint = xmid-j;
     sx[0] = 1.0/6.0*(1.0-xint)*(1.0-xint)*(1.0-xint);
     sx[1] = 2.0/3.0-xint*xint*(1-xint/2.0);
     sx[2] = 2.0/3.0-(1-xint)*(1-xint)*(1.0-0.5*(1-xint));
@@ -57,4 +58,60 @@ int compute_shape_factor <3> (Real* const sx, Real xmid){
     return j-1;
 }
 
+// Compute shifted shape factor and return index of leftmost cell where
+// particle writes, for Esirkepov algorithm.
+// Specialized templates are defined below for orders 1, 2 and 3.
+template <int depos_order>
+AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
+int compute_shifted_shape_factor (amrex::Real* const sx,
+                                  const amrex::Real x_old,
+                                  const int i_new);
+
+// Compute shape factor for order 1.
+template <>
+AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
+int compute_shifted_shape_factor <1> (amrex::Real* const sx,
+                                      const amrex::Real x_old,
+                                      const int i_new){
+    const int i = (int) x_old;
+    const int i_shift = i - i_new;
+    const amrex::Real xint = x_old - i;
+    sx[1+i_shift] = 1.0 - xint;
+    sx[2+i_shift] = xint;
+    return i;
+}
+
+// Compute shape factor for order 2.
+template <>
+AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
+int compute_shifted_shape_factor <2> (amrex::Real* const sx,
+                                      const amrex::Real x_old,
+                                      const int i_new){
+    const int i = (int) (x_old+0.5);
+    const int i_shift = i - (i_new + 1);
+    const amrex::Real xint = x_old - i;
+    sx[1+i_shift] = 0.5*(0.5-xint)*(0.5-xint);
+    sx[2+i_shift] = 0.75-xint*xint;
+    sx[3+i_shift] = 0.5*(0.5+xint)*(0.5+xint);
+    // index of the leftmost cell where particle deposits
+    return i-1;
+}
+
+// Compute shape factor for order 3.
+template <>
+AMREX_GPU_HOST_DEVICE AMREX_FORCE_INLINE
+int compute_shifted_shape_factor <3> (amrex::Real* const sx,
+                                      const amrex::Real x_old,
+                                      const int i_new){
+    const int i = (int) x_old;
+    const int i_shift = i - (i_new + 1);
+    const amrex::Real xint = x_old - i;
+    sx[1+i_shift] = 1.0/6.0*(1.0-xint)*(1.0-xint)*(1.0-xint);
+    sx[2+i_shift] = 2.0/3.0-xint*xint*(1-xint/2.0);
+    sx[3+i_shift] = 2.0/3.0-(1-xint)*(1-xint)*(1.0-0.5*(1-xint));
+    sx[4+i_shift] = 1.0/6.0*xint*xint*xint;
+    // index of the leftmost cell where particle deposits
+    return i-1;
+}
+
 #endif // SHAPEFACTORS_H_