1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
|
/* Copyright 2019-2020 Luca Fedeli, Maxence Thevenet
*
* This file is part of WarpX.
*
* License: BSD-3-Clause-LBNL
*/
#include "NCIGodfreyFilter.H"
#include "Utils/NCIGodfreyTables.H"
#include "Utils/TextMsg.H"
#include <AMReX.H>
#include <AMReX_Algorithm.H>
#include <AMReX_BLassert.H>
#include <AMReX_Config.H>
#include <AMReX_Dim3.H>
#include <AMReX_GpuContainers.H>
#include <AMReX_GpuDevice.H>
#include <AMReX_IntVect.H>
#include <AMReX_Vector.H>
#include <vector>
using namespace amrex;
// Build an NCI Godfrey filter: remember the requested configuration and fix
// the stencil extents. The stencil coefficients themselves are not computed
// here.
//
// coeff_set    : coefficient set to use, stored in m_coeff_set
// cdtodz       : stored in m_cdtodz (presumably c*dt/dz -- TODO confirm)
// nodal_gather : stored in m_nodal_gather
NCIGodfreyFilter::NCIGodfreyFilter(godfrey_coeff_set coeff_set, amrex::Real cdtodz, bool nodal_gather)
{
    // Keep a copy of the constructor arguments in the class data members
    this->m_nodal_gather = nodal_gather;
    this->m_cdtodz = cdtodz;
    this->m_coeff_set = coeff_set;

    // The filter extent is fixed: 5 points along z, 1 point in every other
    // direction (z is the last direction of stencil_length_each_dir).
#if defined(WARPX_DIM_3D)
    slen = {1,1,5};
    stencil_length_each_dir = {1,1,5};
#elif defined(WARPX_DIM_XZ) || defined(WARPX_DIM_RZ)
    // In 2D, z is stored as the second component; the third one is padding
    slen = {1,5,1};
    stencil_length_each_dir = {1,5};
#else
    // Any other geometry is unsupported
    amrex::ignore_unused(coeff_set, cdtodz, nodal_gather);
    WARPX_ABORT_WITH_MESSAGE(
        "NCIGodfreyFilter not implemented in 1D!");
#endif
}
// Compute the filter stencils on the host and copy them into stencil_x,
// stencil_y (3D only) and stencil_z.
//
// Four "prestencil" coefficients are interpolated linearly between two
// consecutive rows of a tabulated coefficient set. The table is chosen from
// m_nodal_gather (Galerkin tables for a staggered-grid gather,
// momentum-conserving tables for a node-centered gather) and from m_coeff_set
// (Ex_Ey_Bz or Bx_By_Ez). The 5-point stencil along z is then built from the
// prestencil; x (and y in 3D) get a single coefficient, i.e. no filtering.
//
// Aborts if the build is not 2D/3D, if the z extent of the filter is not 5,
// if the tables do not provide exactly 4 coefficients per row, or if
// m_coeff_set is not one of the two supported sets.
void NCIGodfreyFilter::ComputeStencils(){
#if (AMREX_SPACEDIM >= 2)
    using namespace warpx::nci_godfrey;

    // Sanity checks: filter length should be 5 in z
#if defined(WARPX_DIM_3D)
    WARPX_ALWAYS_ASSERT_WITH_MESSAGE(
        slen.z==5,"ERROR: NCI filter requires 5 points in z");
#else
    // In 2D, the z extent is stored in the second component of slen
    WARPX_ALWAYS_ASSERT_WITH_MESSAGE(
        slen.y==5,"ERROR: NCI filter requires 5 points in z");
#endif

    // The stencil formulas below consume exactly prestencil[0..3], while the
    // prestencil is filled with tab_width values per table row: make sure
    // both agree, so that we never write past the array nor read
    // uninitialized entries.
    WARPX_ALWAYS_ASSERT_WITH_MESSAGE(
        tab_width==4,
        "ERROR: NCI Godfrey tables must provide exactly 4 coefficients per row");

    // Locate the pair of table rows (index, index+1) used for the
    // interpolation; index is clamped so that both rows exist.
    auto index = static_cast<int>(tab_length*m_cdtodz);
    index = min(index, tab_length-2);
    index = max(index, 0);
    // NOTE(review): this weight is not rescaled by tab_length, so whenever
    // index is not clamped it lies in [0, 1/tab_length) rather than [0, 1).
    // Kept unchanged to preserve existing results -- confirm this is intended.
    Real const weight_right = m_cdtodz - amrex::Real(index)/amrex::Real(tab_length);

    // Interpolate coefficients from the given table, and store into
    // prestencil (the stencil is computed from these coefficients).
    Real prestencil[4];
    auto const interpolate_prestencil = [&](auto const& table)
    {
        for (int i = 0; i < tab_width; ++i) {
            prestencil[i] = (1_rt-weight_right)*table[index  ][i] +
                                  weight_right *table[index+1][i];
        }
    };

    // Select the table once (the choice does not depend on the coefficient)
    if (m_coeff_set == godfrey_coeff_set::Ex_Ey_Bz) {
        // Set of coefficients for Ex, Ey and Bz
        if (m_nodal_gather) {
            // Gather from node-centered grid: momentum-conserving gather
            interpolate_prestencil(table_nci_godfrey_momentum_Ex_Ey_Bz);
        } else {
            // Gather from staggered grid: Galerkin gather
            interpolate_prestencil(table_nci_godfrey_galerkin_Ex_Ey_Bz);
        }
    } else if (m_coeff_set == godfrey_coeff_set::Bx_By_Ez) {
        // Set of coefficients for Bx, By and Ez
        if (m_nodal_gather) {
            // Gather from node-centered grid: momentum-conserving gather
            interpolate_prestencil(table_nci_godfrey_momentum_Bx_By_Ez);
        } else {
            // Gather from staggered grid: Galerkin gather
            interpolate_prestencil(table_nci_godfrey_galerkin_Bx_By_Ez);
        }
    } else {
        WARPX_ABORT_WITH_MESSAGE(
            "m_coeff_set must be godfrey_coeff_set::Ex_Ey_Bz or godfrey_coeff_set::Bx_By_Ez");
    }

    // Compute stencil_z
    Vector<Real> h_stencil_z(5);
    h_stencil_z[0] =  (256 + 128*prestencil[0] + 96*prestencil[1] + 80*prestencil[2] + 70*prestencil[3]) / 256;
    h_stencil_z[1] = -(       64*prestencil[0] + 64*prestencil[1] + 60*prestencil[2] + 56*prestencil[3]) / 256;
    h_stencil_z[2] =  (                          16*prestencil[1] + 24*prestencil[2] + 28*prestencil[3]) / 256;
    h_stencil_z[3] = -(                                              4*prestencil[2] +  8*prestencil[3]) / 256;
    h_stencil_z[4] =  (                                                                 1*prestencil[3]) / 256;

    // Compute h_stencil_x and h_stencil_y (no filter in these directions,
    // so only 1 coeff, equal to 1)
    Vector<Real> h_stencil_x(1);
    h_stencil_x[0] = 1._rt;
#if defined(WARPX_DIM_3D)
    Vector<Real> h_stencil_y(1);
    h_stencil_y[0] = 1._rt;
#endif

    // Due to the way Filter::DoFilter() is written,
    // coefficient 0 has to be /2
    h_stencil_x[0] /= 2._rt;
#if defined(WARPX_DIM_3D)
    h_stencil_y[0] /= 2._rt;
#endif
    h_stencil_z[0] /= 2._rt;

    // Size the destination stencils, then copy the host values into them
    stencil_x.resize(h_stencil_x.size());
#if defined(WARPX_DIM_3D)
    stencil_y.resize(h_stencil_y.size());
#endif
    stencil_z.resize(h_stencil_z.size());

    Gpu::copyAsync(Gpu::hostToDevice,h_stencil_x.begin(),h_stencil_x.end(),stencil_x.begin());
#if defined(WARPX_DIM_3D)
    Gpu::copyAsync(Gpu::hostToDevice,h_stencil_y.begin(),h_stencil_y.end(),stencil_y.begin());
#endif
    Gpu::copyAsync(Gpu::hostToDevice,h_stencil_z.begin(),h_stencil_z.end(),stencil_z.begin());
    // The copies above are asynchronous and read from local host vectors:
    // synchronize before those vectors are destroyed on return.
    Gpu::synchronize();
#else
    WARPX_ABORT_WITH_MESSAGE("NCIGodfreyFilter not implemented in 1D!");
#endif
}
|