ERF
Energy Research and Forecasting: An Atmospheric Modeling Code
ERF_NCWpsFile.H
Go to the documentation of this file.
1 #ifndef ERF_NCWPSFILE_H_
2 #define ERF_NCWPSFILE_H_
3 
4 #include <sstream>
5 #include <string>
6 #include <atomic>
7 
8 #include "AMReX_FArrayBox.H"
9 #include "AMReX_IArrayBox.H"
10 #include "ERF_EpochTime.H"
11 #include "ERF_NCInterface.H"
12 
13 using PlaneVector = amrex::Vector<amrex::FArrayBox>;
14 
15 /*
16  // Read from metgrid
17  NetCDF variables of dimensions Time_BT_SN_WE: "UU", "VV", "TT", "RH", "PRES", "GHT"
18  NetCDF variables of dimensions Time_SN_WE : "HGT", "MAPFAC_U", "MAPFAC_V", "MAPFAC_M", "PSFC"
19  NetCDF global attributes of type int : "WEST-EAST_GRID_DIMENSION", "SOUTH-NORTH_GRID_DIMENSION"
20  NetCDF global attributes of type string : "SIMULATION_START_DATE"
21  NetCDF global attributes of type real : "DX", "DY"
22 
23  // Read from wrfbdy
24  NetCDF variables of dimensions Time_BdyWidth_BT_SN : "U_BXS", "U_BXE", "V_BXS", "V_BXE" etc.
25  NetCDF variables of dimensions Time_BdyWidth_BT_WE : "U_BYS", "U_BYE", "V_BYS", "V_BYE" etc.
26  NetCDF variables of dimensions Time_BdyWidth_SN : "MU_BXS", "MU_BXE", "PC_BXS", "PC_BXE", etc.
27  NetCDF variables of dimensions Time_BdyWidth_WE : "MU_BYS", "MU_BYE", "PC_BYS", "PC_BYE", etc.
28 */
29 enum class NC_Data_Dims_Type {
30  Time_SL_SN_WE, // Time, Soil Layers, South-North, West-East
32  Time_SN_WE,
33  Time_BT,
34  Time_SL, // Time, Soil layers
35  Time,
40 };
41 
42 //
43 // NDArray is the datatype designed to hold any data, including scalars, multidimensional
44 // arrays, that read from the NetCDF file.
45 //
46 // The data read from NetCDF file are stored in a continuous memory, and the data layout is described
47 // by using a vector (shape). AMRex Box can be constructed using the data shape information, and MultiFab
48 // data array can be setup using the data that stored in the NDArray.
49 //
50 template <typename DataType>
51 struct NDArray
52 {
53  using DType = typename std::remove_const<DataType>::type;
54 
55  // constructor
56  explicit NDArray (const std::string vname, const std::vector<size_t>& vshape)
57  : name{vname}, shape{vshape}, ref_counted{1}, owned{true} {
58  data = new DType [this->ndim()];
59  }
60 
61  // default constructor
62  NDArray () : name{"null"}, ref_counted{1}, owned{false}, data{nullptr} {}
63 
64  // copy constructor
65  NDArray (const NDArray& array) {
66  name = array.name;
67  shape = array.shape;
68  data = array.data;
69  owned = false;
70  ref_counted.fetch_add(1, std::memory_order_relaxed);
71  }
72 
73  // copy assignment
74  NDArray& operator=(const NDArray& array) {
75  name = array.name;
76  shape = array.shape;
77  data = array.data;
78  owned = false;
79  ref_counted.fetch_add(1, std::memory_order_relaxed);
80  return *this;
81  }
82 
83  // destructor
84  ~NDArray () {
85  ref_counted.fetch_sub(1, std::memory_order_acq_rel);
86  if (ref_counted == 1 && owned) delete[] data;
87  }
88 
89  // get the data pointer
90  decltype(auto) get_data () {
91  ref_counted.fetch_add(1, std::memory_order_relaxed);
92  return data;
93  }
94 
95  // get the variable name
96  std::string get_vname () {
97  return name;
98  }
99 
100  // get the variable data shape
101  std::vector<size_t> get_vshape () {
102  return shape;
103  }
104 
105  // return the total number of data
106  size_t ndim () {
107  size_t num = 1;
108  int isize = static_cast<int>(shape.size());
109  for (auto i=0; i<isize; ++i) num *= shape[i];
110  return num;
111  }
112 
113  // set the data shape information
114  void set_vshape (std::vector<size_t> vshape) {
115  shape = vshape;
116  }
117 
118  private:
119  std::string name;
120  std::vector<size_t> shape;
121  mutable std::atomic<size_t> ref_counted;
122  bool owned;
124 };
125 
126 int BuildFABsFromWRFBdyFile (const std::string &fname,
127  amrex::Vector<amrex::Vector<amrex::FArrayBox>>& bdy_data_xlo,
128  amrex::Vector<amrex::Vector<amrex::FArrayBox>>& bdy_data_xhi,
129  amrex::Vector<amrex::Vector<amrex::FArrayBox>>& bdy_data_ylo,
130  amrex::Vector<amrex::Vector<amrex::FArrayBox>>& bdy_data_yhi);
131 
132 template<typename DType>
133 void ReadTimeSliceFromNetCDFFile (const std::string& fname,
134  const int tidx,
135  amrex::Vector<std::string> names,
136  amrex::Vector<NDArray<DType> >& arrays,
137  amrex::Vector<int>& success)
138 {
139  amrex::Print() << "Reading time slice " << tidx << " from " << fname << std::endl;
140  AMREX_ASSERT(arrays.size() == names.size());
141 
142  if (amrex::ParallelDescriptor::IOProcessor())
143  {
144  auto ncf = ncutils::NCFile::open(fname, NC_CLOBBER | NC_NETCDF4);
145 
146  int ntimes = ncf.dim("Time").len();
147  AMREX_ALWAYS_ASSERT((tidx >= 0) && (tidx < ntimes));
148 
149  for (auto n=0; n<arrays.size(); ++n)
150  {
151  std::string vname_to_write = names[n];
152  std::string vname_to_read = names[n];
153  if (vname_to_read.substr(0,2) == "R_") {
154  vname_to_read = names[n+4]; // This allows us to read "T" instead -- we will over-write this later
155  }
156 
157  success[n] = ncf.has_var(vname_to_read);
158 
159  if (success[n] == 1)
160  {
161  std::vector<std::string> dimnames = ncf.var(vname_to_read).dimnames();
162  AMREX_ALWAYS_ASSERT(dimnames[0] == "Time");
163 
164  std::vector<size_t> count = ncf.var(vname_to_read).shape();
165  std::vector<size_t> start(count.size(), 0);
166  start[0] = tidx;
167  count[0] = 1;
168 
169  arrays[n] = NDArray<DType>(vname_to_read, count);
170  DType* dataPtr = arrays[n].get_data();
171 
172  ncf.var(vname_to_read).get(dataPtr, start, count);
173  } // has_var
174  }
175  ncf.close();
176  }
177 }
178 
179 template<typename DType>
180 void ReadNetCDFFile (const std::string& fname, amrex::Vector<std::string> names,
181  amrex::Vector<NDArray<DType> >& arrays, amrex::Vector<int>& success)
182 {
183  AMREX_ASSERT(arrays.size() == names.size());
184 
185  if (amrex::ParallelDescriptor::IOProcessor())
186  {
187  auto ncf = ncutils::NCFile::open(fname, NC_CLOBBER | NC_NETCDF4);
188 
189  /*
190  // get the dimension information
191  int Time = static_cast<int>(ncf.dim("Time").len());
192  int DateStrLen = static_cast<int>(ncf.dim("DateStrLen").len());
193  int west_east = static_cast<int>(ncf.dim("west_east").len());
194  int south_north = static_cast<int>(ncf.dim("south_north").len());
195  int bottom_top = static_cast<int>(ncf.dim("bottom_top").len());
196  int bottom_top_stag = static_cast<int>(ncf.dim("bottom_top_stag").len());
197  int west_east_stag = static_cast<int>(ncf.dim("west_east_stag").len());
198  int south_north_stag = static_cast<int>(ncf.dim("south_north_stag").len());
199  int bdy_width = static_cast<int>(ncf.dim("bdy_width").len());
200  */
201 
202  // amrex::Print() << "Reading the dimensions from the netcdf file " << "\n";
203 
204  for (auto n=0; n<arrays.size(); ++n)
205  {
206  std::string vname_to_write = names[n];
207  std::string vname_to_read = names[n];
208 
209  if (vname_to_read.substr(0,2) == "R_") {
210  vname_to_read = names[n+4]; // This allows us to read "T" instead -- we will over-write this later
211  }
212 
213  success[n] = ncf.has_var(vname_to_read);
214  if (success[n] == 0) {
215  amrex::Print() << " Skipping " << vname_to_read << std::endl;
216  } else {
217  amrex::Print() << " Reading " << vname_to_read << std::endl;
218  }
219 
220  if (success[n] == 1) {
221 
222  std::vector<std::string> dimnames = ncf.var(vname_to_read).dimnames();
223  AMREX_ALWAYS_ASSERT(dimnames[0] == "Time" || dimnames[0] == "time");
224 
225  std::vector<size_t> shape = ncf.var(vname_to_read).shape();
226  arrays[n] = NDArray<DType>(vname_to_read,shape);
227  DType* dataPtr = arrays[n].get_data();
228 
229  std::vector<size_t> start(shape.size(), 0);
230 
231 #if 0
232  auto numPts = arrays[n].ndim();
233  amrex::Print() << "NetCDF Variable name = " << vname_to_read << std::endl;
234  amrex::Print() << "numPts read from NetCDF file/var = " << numPts << std::endl;
235  amrex::Print() << "Dims in var = " << ncf.var(vname_to_read).ndim() << std::endl;
236  amrex::Print() << "Dim names = (";
237  for (auto &dim:dimnames)
238  amrex::Print() << dim << ", " ;
239  amrex::Print() << ")" << std::endl;
240  amrex::Print() << "Dims of the variable = (";
241  for (auto &dim:shape)
242  amrex::Print() << dim << ", " ;
243  amrex::Print() << ")" << std::endl;
244 #endif
245 
246  ncf.var(vname_to_read).get(dataPtr, start, shape);
247 
248  } // has_var
249  }
250  ncf.close();
251  }
252 }
253 
254 /**
255  * Helper function for reading data from NetCDF file into a
256  * provided FAB.
257  *
258  * @param iv Index for which variable we are going to fill
259  * @param nc_arrays Arrays of data from NetCDF file
260  * @param var_name Variable name
261  * @param NC_dim_type Dimension type for the variable as stored in the NetCDF file
262  * @param temp FAB where we store the variable data from the NetCDF Arrays
263  */
264 template<class FAB,typename DType>
265 void
267  const amrex::Box& domain,
268  amrex::Vector<NDArray<float>>& nc_arrays,
269  const std::string& var_name,
270  NC_Data_Dims_Type& NC_dim_type,
271  FAB& temp)
272 {
273  int ns1, ns2, ns3; // bottom_top, south_north, west_east (these can be staggered or unstaggered)
274  if (NC_dim_type == NC_Data_Dims_Type::Time_BT) {
275  ns1 = nc_arrays[iv].get_vshape()[1];
276  ns2 = 1;
277  ns3 = 1;
278  // amrex::Print() << "TYPE BT " << ns1 << std::endl;
279  } else if (NC_dim_type == NC_Data_Dims_Type::Time_SN_WE) {
280  ns1 = 1;
281  ns2 = nc_arrays[iv].get_vshape()[1];
282  ns3 = nc_arrays[iv].get_vshape()[2];
283  // amrex::Print() << "TYPE SN WE " << ns2 << " " << ns3 << std::endl;
284  } else if (NC_dim_type == NC_Data_Dims_Type::Time_BT_SN_WE) {
285  ns1 = nc_arrays[iv].get_vshape()[1];
286  ns2 = nc_arrays[iv].get_vshape()[2];
287  ns3 = nc_arrays[iv].get_vshape()[3];
288  // amrex::Print() << "TYPE BT SN WE " << ns1 << " " << ns2 << " " << ns3 << std::endl;
289  } else if (NC_dim_type == NC_Data_Dims_Type::Time_SL_SN_WE) {
290  ns1 = nc_arrays[iv].get_vshape()[1];
291  ns2 = nc_arrays[iv].get_vshape()[2];
292  ns3 = nc_arrays[iv].get_vshape()[3];
293  // amrex::Print() << "TYPE SL SN WE " << ns1 << " " << ns2 << " " << ns3 << std::endl;
294  } else if (NC_dim_type == NC_Data_Dims_Type::Time_SL) {
295  ns1 = nc_arrays[iv].get_vshape()[1];
296  ns2 = 1;
297  ns3 = 1;
298  // amrex::Print() << "TYPE SL " << ns1 << std::endl;
299  }
300  else {
301  amrex::Abort("Dont know this NC_Data_Dims_Type");
302  }
303 
304  // allow fewer z levels to be read in
305  // - ns1 may be the bottom_top or bottom_top_stag dim
306  // - domain.bigEnd(2) is the input number of cells in z
307  // - khi may be nz==bottom_top, nz < bottom_top, or 0 for 2D fields
308  int khi = std::min(domain.bigEnd(2), ns1-1);
309 
310  // TODO: The box will only start at (0,0,0) at level 0 -- we need to generalize this
311  amrex::Box in_box(amrex::IntVect(0,0,0), amrex::IntVect(ns3-1,ns2-1,ns1-1)); // ns1 may or may not be staggered
312  amrex::Box my_box(amrex::IntVect(0,0,0), amrex::IntVect(ns3-1,ns2-1,khi));
313 
314  if (var_name == "PH" || var_name == "PHB") {
315  my_box.setType(amrex::IndexType(amrex::IntVect(0,0,1)));
316  my_box.setBig(2, khi+1);
317  }
318  else if (var_name == "U" || var_name == "UU" || var_name == "MAPFAC_U") {
319  my_box.setType(amrex::IndexType(amrex::IntVect(1,0,0)));
320  }
321  else if (var_name == "V" || var_name == "VV" || var_name == "MAPFAC_V") {
322  my_box.setType(amrex::IndexType(amrex::IntVect(0,1,0)));
323  }
324  else if (var_name == "W" || var_name == "WW") {
325  my_box.setType(amrex::IndexType(amrex::IntVect(0,0,1)));
326  my_box.setBig(2, khi+1);
327  }
328  else if (var_name == "TSLB" || var_name == "SMOIS" || var_name == "SH2O" || var_name == "ZS" || var_name == "DZS") {
329  // soil variables are staggered in z
330  my_box.setType(amrex::IndexType(amrex::IntVect(0,0,1)));
331  }
332 
333  amrex::Arena* Arena_Used = amrex::The_Arena();
334 #ifdef AMREX_USE_GPU
335  // Make sure temp lives on CPU since nc_arrays lives on CPU only
336  Arena_Used = amrex::The_Pinned_Arena();
337 #endif
338  temp.resize(my_box,1, Arena_Used);
339  amrex::Array4<DType> fab_arr = temp.array();
340 
341  int ioff = temp.box().smallEnd()[0];
342  int joff = temp.box().smallEnd()[1];
343  int kmax = temp.box().bigEnd()[2]; // highest z level to be read in
344  //amrex::Print() << var_name << " domain khi, kmax, ns1 = " << khi << " " << kmax << " " << ns1 << std::endl;
345 
346  auto num_pts = in_box.numPts();
347 
348  for (int n(0); n < num_pts; ++n) {
349  int k = n / (ns2*ns3);
350  if (k > kmax) continue;
351  int j = (n - k*(ns2*ns3)) / ns3 + joff;
352  int i = n - k*(ns2*ns3) - (j-joff) * ns3 + ioff;
353  fab_arr(i,j,k,0) = static_cast<DType>(*(nc_arrays[iv].get_data()+n));
354  }
355 }
356 
357 /**
358  * Function to read NetCDF variables and fill the corresponding Array4's
359  *
360  * @param fname Name of the NetCDF file to be read
361  * @param nc_var_names Variable names in the NetCDF file
362  * @param NC_dim_types NetCDF data dimension types
363  * @param fab_vars Fab data we are to fill
364  */
365 template<class FAB,typename DType>
366 void
367 BuildFABsFromNetCDFFile (const amrex::Box& domain,
368  const std::string &fname,
369  amrex::Vector<std::string> nc_var_names,
370  amrex::Vector<enum NC_Data_Dims_Type> NC_dim_types,
371  amrex::Vector<FAB*> fab_vars,
372  amrex::Vector<int>& success)
373 {
374  int ioproc = amrex::ParallelDescriptor::IOProcessorNumber(); // I/O rank
375 
376  amrex::Vector<NDArray<float>> nc_arrays(nc_var_names.size());
377 
378  if (amrex::ParallelDescriptor::IOProcessor())
379  {
380  ReadNetCDFFile(fname, nc_var_names, nc_arrays, success);
381  }
382 
383  amrex::ParallelDescriptor::Bcast(success.dataPtr(), success.size(), ioproc);
384 
385  for (int iv = 0; iv < nc_var_names.size(); iv++)
386  {
387  if (success[iv] == 1) {
388  FAB tmp;
389  if (amrex::ParallelDescriptor::IOProcessor()) {
390  fill_fab_from_arrays<FAB,DType>(iv, domain, nc_arrays, nc_var_names[iv], NC_dim_types[iv], tmp);
391  }
392 
393  int ncomp = tmp.nComp();
394  amrex::Box box = tmp.box();
395 
396  amrex::ParallelDescriptor::Bcast(&box, 1, ioproc);
397  amrex::ParallelDescriptor::Bcast(&ncomp, 1, ioproc);
398 
399  if (!amrex::ParallelDescriptor::IOProcessor()) {
400 #ifdef AMREX_USE_GPU
401  tmp.resize(box,ncomp,amrex::The_Pinned_Arena());
402 #else
403  tmp.resize(box,ncomp);
404 #endif
405  }
406 
407  amrex::ParallelDescriptor::Bcast(tmp.dataPtr(), tmp.size(), ioproc);
408 
409  // Shift box by the domain lower corner
410  amrex::Box fab_bx = tmp.box();
411  amrex::Dim3 dom_lb = lbound(domain);
412  fab_bx += amrex::IntVect(dom_lb.x,dom_lb.y,dom_lb.z);
413  // fab_vars points to data on device
414  fab_vars[iv]->resize(fab_bx,1);
415 #ifdef AMREX_USE_GPU
416  amrex::Gpu::copy(amrex::Gpu::hostToDevice,
417  tmp.dataPtr(), tmp.dataPtr() + tmp.size(),
418  fab_vars[iv]->dataPtr());
419 #else
420  // Provided by BaseFab inheritance through FArrayBox
421  fab_vars[iv]->copy(tmp,tmp.box(),0,fab_bx,0,1);
422 #endif
423  } // success
424  } // iv
425 }
426 #endif
@ num
Definition: ERF_DataStruct.H:22
void ReadNetCDFFile(const std::string &fname, amrex::Vector< std::string > names, amrex::Vector< NDArray< DType > > &arrays, amrex::Vector< int > &success)
Definition: ERF_NCWpsFile.H:180
NC_Data_Dims_Type
Definition: ERF_NCWpsFile.H:29
void fill_fab_from_arrays(int iv, const amrex::Box &domain, amrex::Vector< NDArray< float >> &nc_arrays, const std::string &var_name, NC_Data_Dims_Type &NC_dim_type, FAB &temp)
Definition: ERF_NCWpsFile.H:266
void BuildFABsFromNetCDFFile(const amrex::Box &domain, const std::string &fname, amrex::Vector< std::string > nc_var_names, amrex::Vector< enum NC_Data_Dims_Type > NC_dim_types, amrex::Vector< FAB * > fab_vars, amrex::Vector< int > &success)
Definition: ERF_NCWpsFile.H:367
amrex::Vector< amrex::FArrayBox > PlaneVector
Definition: ERF_NCWpsFile.H:13
int BuildFABsFromWRFBdyFile(const std::string &fname, amrex::Vector< amrex::Vector< amrex::FArrayBox >> &bdy_data_xlo, amrex::Vector< amrex::Vector< amrex::FArrayBox >> &bdy_data_xhi, amrex::Vector< amrex::Vector< amrex::FArrayBox >> &bdy_data_ylo, amrex::Vector< amrex::Vector< amrex::FArrayBox >> &bdy_data_yhi)
void ReadTimeSliceFromNetCDFFile(const std::string &fname, const int tidx, amrex::Vector< std::string > names, amrex::Vector< NDArray< DType > > &arrays, amrex::Vector< int > &success)
Definition: ERF_NCWpsFile.H:133
static NCFile open(const std::string &name, const int cmode=NC_NOWRITE)
Definition: ERF_NCInterface.cpp:707
Definition: ERF_NCWpsFile.H:52
bool owned
Definition: ERF_NCWpsFile.H:122
std::string name
Definition: ERF_NCWpsFile.H:119
size_t ndim()
Definition: ERF_NCWpsFile.H:106
NDArray()
Definition: ERF_NCWpsFile.H:62
std::string get_vname()
Definition: ERF_NCWpsFile.H:96
NDArray(const NDArray &array)
Definition: ERF_NCWpsFile.H:65
NDArray & operator=(const NDArray &array)
Definition: ERF_NCWpsFile.H:74
void set_vshape(std::vector< size_t > vshape)
Definition: ERF_NCWpsFile.H:114
NDArray(const std::string vname, const std::vector< size_t > &vshape)
Definition: ERF_NCWpsFile.H:56
std::atomic< size_t > ref_counted
Definition: ERF_NCWpsFile.H:121
typename std::remove_const< DataType >::type DType
Definition: ERF_NCWpsFile.H:53
std::vector< size_t > shape
Definition: ERF_NCWpsFile.H:120
DType * data
Definition: ERF_NCWpsFile.H:123
decltype(auto) get_data()
Definition: ERF_NCWpsFile.H:90
std::vector< size_t > get_vshape()
Definition: ERF_NCWpsFile.H:101
~NDArray()
Definition: ERF_NCWpsFile.H:84