IODA
ObsSpace.cc
Go to the documentation of this file.
1 /*
2  * (C) Copyright 2017-2021 UCAR
3  *
4  * This software is licensed under the terms of the Apache Licence Version 2.0
5  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
6  */
7 
8 #include "ioda/ObsSpace.h"
9 
10 #include <algorithm>
11 #include <cmath>
12 #include <fstream>
13 #include <iomanip>
14 #include <map>
15 #include <memory>
16 #include <set>
17 #include <string>
18 #include <utility>
19 #include <vector>
20 
21 #include "eckit/config/Configuration.h"
22 #include "eckit/exception/Exceptions.h"
23 
24 #include "oops/mpi/mpi.h"
25 #include "oops/util/abor1_cpp.h"
26 #include "oops/util/DateTime.h"
27 #include "oops/util/Duration.h"
28 #include "oops/util/Logger.h"
29 #include "oops/util/missingValues.h"
30 #include "oops/util/Random.h"
31 #include "oops/util/stringFunctions.h"
32 
33 #include "ioda/distribution/Accumulator.h"
34 #include "ioda/distribution/DistributionFactory.h"
35 #include "ioda/distribution/DistributionUtils.h"
36 #include "ioda/distribution/PairOfDistributions.h"
37 #include "ioda/Engines/HH.h"
38 #include "ioda/io/ObsFrameRead.h"
39 #include "ioda/io/ObsFrameWrite.h"
41 
42 namespace ioda {
43 
44 namespace {
45 
46 // If the variable name \p name ends with an underscore followed by a number (potentially a channel
47 // number), split it at that underscore, store the two parts in \p nameWithoutChannelSuffix and
48 // \p channel, and return true. Otherwise return false.
49 bool extractChannelSuffixIfPresent(const std::string &name,
50  std::string &nameWithoutChannelSuffix, int &channel) {
51  const std::string::size_type lastUnderscore = name.find_last_of('_');
52  if (lastUnderscore != std::string::npos &&
53  name.find_first_not_of("0123456789", lastUnderscore + 1) == std::string::npos) {
54  // The variable name has a numeric suffix.
55  channel = std::stoi(name.substr(lastUnderscore + 1));
56  nameWithoutChannelSuffix = name.substr(0, lastUnderscore);
57  return true;
58  }
59  return false;
60 }
61 
62 } // namespace
63 
64 // ----------------------------- public functions ------------------------------
65 // -----------------------------------------------------------------------------
67  // The following code needs to stay in sync with the ObsDimensionId enum object.
68  // The entries are the standard dimension names according to the unified naming convention.
69  std::string dimName = "nlocs";
73 
74  dimName = "nchans";
78 }
79 
80 ObsDimensionId ObsDimInfo::get_dim_id(const std::string & dimName) const {
81  return dim_name_id_.at(dimName);
82 }
83 
84 std::string ObsDimInfo::get_dim_name(const ObsDimensionId dimId) const {
85  return dim_id_name_.at(dimId);
86 }
87 
88 std::size_t ObsDimInfo::get_dim_size(const ObsDimensionId dimId) const {
89  return dim_id_size_.at(dimId);
90 }
91 
92 void ObsDimInfo::set_dim_size(const ObsDimensionId dimId, std::size_t dimSize) {
93  dim_id_size_.at(dimId) = dimSize;
94 }
95 
96 // -----------------------------------------------------------------------------
97 /*!
98  * \details Config based constructor for an ObsSpace object. This constructor will read
99  * in from the obs file and transfer the variables into the obs container. Obs
100  * falling outside the DA timing window, specified by bgn and end, will be
101  * discarded before storing them in the obs container.
102  *
103  * \param[in] config ECKIT configuration segment holding obs types specs
104  * \param[in] comm MPI communicator containing all processes that hold the observations for a
105  * given time slot or sub-window.
106  * \param[in] bgn DateTime object holding the start of the DA timing window
107  * \param[in] end DateTime object holding the end of the DA timing window
108  * \param[in] time MPI communicator across time so that the 2D array of processes represented by
109  * the product of the comm and time communicators hold all observations in the
110  * ObsSpace.
111  */
112 ObsSpace::ObsSpace(const Parameters_ & params, const eckit::mpi::Comm & comm,
113  const util::DateTime & bgn, const util::DateTime & end,
114  const eckit::mpi::Comm & timeComm)
115  : oops::ObsSpaceBase(params, comm, bgn, end),
116  winbgn_(bgn), winend_(end), commMPI_(comm),
117  gnlocs_(0), nrecs_(0), obsvars_(),
118  obs_group_(), obs_params_(params, bgn, end, comm, timeComm)
119 {
120  oops::Log::trace() << "ObsSpace::ObsSpace config = " << obs_params_.top_level_ << std::endl;
121 
124  if (obs_params_.top_level_.derivedSimVars.value().size() != 0) {
125  // As things stand, this assert cannot fail, since both variables take the list of channels
126  // from the same "channels" YAML option.
127  ASSERT(obs_params_.top_level_.derivedSimVars.value().channels() == obsvars_.channels());
129  }
130  oops::Log::info() << this->obsname() << " vars: " << obsvars_ << std::endl;
131 
132  // Open the source (ObsFrame) of the data for initializing the obs_group_ (ObsGroup)
133  ObsFrameRead obsFrame(obs_params_);
134 
135  // Retrieve the MPI distribution object
136  dist_ = obsFrame.distribution();
137 
138  createObsGroupFromObsFrame(obsFrame);
139  initFromObsSource(obsFrame);
140 
141  // After walking through all the frames, gnlocs_ and gnlocs_outside_timewindow_
142  // are set representing the entire file. This is because they are calculated
143  // before doing the MPI distribution.
144  gnlocs_ = obsFrame.globalNumLocs();
146 
147  if (this->obs_sort_var() != "") {
149  recidx_is_sorted_ = true;
150  } else {
151  // Fill the recidx_ map with indices that represent each group, but are not
152  // sorted. This is done so the recidx_ structure can be used to walk
153  // through the individual groups. For example, this can be used to calculate
154  // RMS values for each group.
156  recidx_is_sorted_ = false;
157  }
158 
160 
161  if (obs_params_.top_level_.obsExtend.value() != boost::none) {
163  }
164 
165  /// If save_obs_distribution set to true,
166  /// global location indices and record numbers will be stored
167  /// in the MetaData/saved_index and MetaData/saved_record_number variables, respectively.
168  /// These variables will be saved along with all other variables
169  /// to the output files generated if the obsdataout.obsfile option is set.
170  ///
171  /// When the "obsdatain.read obs from separate file" option is set for later runs,
172  /// each process reads a separate input file directly,
173  /// the presence of these variables makes it possible
174  /// to identify observations stored in more than one input file.
175 
176  const bool save_obs_distribution = obs_params_.top_level_.saveObsDistribution;
177  if (save_obs_distribution && "Halo" == obs_params_.top_level_.distName.value()) {
178  const size_t nlocs = this->nlocs();
179 
180  std::vector<int> idx2int(nlocs);
181  std::vector<int> rec2int(nlocs);
182 
183  for (size_t loc = 0; loc < nlocs; ++loc) {
184  idx2int[loc] = static_cast<int>(indx_[loc]);
185  rec2int[loc] = static_cast<int>(recnums_[loc]);
186  }
187 
188  // Save Index and Records
189  put_db("MetaData", "saved_index", idx2int);
190  put_db("MetaData", "saved_record_number", rec2int);
191  }
192 
194 
195  oops::Log::debug() << obsname() << ": " << globalNumLocsOutsideTimeWindow()
196  << " observations are outside of time window out of "
198  << std::endl;
199 
200  oops::Log::trace() << "ObsSpace::ObsSpace constructed name = " << obsname() << std::endl;
201 }
202 
203 // -----------------------------------------------------------------------------
204 void ObsSpace::save() {
205  if (obs_params_.top_level_.obsOutFile.value() != boost::none) {
206  std::string fileName = obs_params_.top_level_.obsOutFile.value()->fileName;
207  oops::Log::info() << obsname() << ": save database to " << fileName << std::endl;
208  saveToFile();
209  // Call the mpi barrier command here to force all processes to wait until
210  // all processes have finished writing their files. This is done to prevent
211  // the early processes continuing and potentially executing their obs space
212  // destructor before others finish writing. This situation is known to have
213  // issues with hdf file handles getting deallocated before some of the MPI
214  // processes are finished with them.
215  this->comm().barrier();
216  } else {
217  oops::Log::info() << obsname() << " : no output" << std::endl;
218  }
219 }
220 
221 // -----------------------------------------------------------------------------
222 std::size_t ObsSpace::nvars() const {
223  // Nvars is the number of variables in the ObsValue group. By querying
224  // the ObsValue group, nvars will keep track of new variables that are added
225  // during a run.
226  // Some of the generators, upon construction, do not create variables in ObsValue
227  // since the MakeObs function will do that. In this case, they instead create
228  // error estimates in ObsError with the expectation that ObsValue will be filled
229  // in later. So upon construction, nvars will be the number of variables in ObsError
230  // instead of ObsValue.
231  // Because of the generator case above, query ObsValue first and if ObsValue doesn't
232  // exist query ObsError.
233  std::size_t numVars = 0;
234  if (obs_group_.exists("ObsValue")) {
235  numVars = obs_group_.open("ObsValue").vars.list().size();
236  } else if (obs_group_.exists("ObsError")) {
237  numVars = obs_group_.open("ObsError").vars.list().size();
238  }
239  return numVars;
240 }
241 
242 // -----------------------------------------------------------------------------
243 const std::vector<std::string> & ObsSpace::obs_group_vars() const {
244  return obs_params_.top_level_.obsIoInParameters().obsGrouping.value().obsGroupVars;
245 }
246 
247 // -----------------------------------------------------------------------------
248 std::string ObsSpace::obs_sort_var() const {
249  return obs_params_.top_level_.obsIoInParameters().obsGrouping.value().obsSortVar;
250 }
251 
252 // -----------------------------------------------------------------------------
253 std::string ObsSpace::obs_sort_order() const {
254  return obs_params_.top_level_.obsIoInParameters().obsGrouping.value().obsSortOrder;
255 }
256 
257 // -----------------------------------------------------------------------------
258 /*!
259  * \details This method checks for the existence of the group, name combination
260  * in the obs container. If the combination exists, "true" is returned,
261  * otherwise "false" is returned.
262  */
263 bool ObsSpace::has(const std::string & group, const std::string & name, bool skipDerived) const {
264  // For backward compatibility, recognize and handle appropriately variable names with
265  // channel suffixes.
266  std::string nameToUse;
267  std::vector<int> chanSelectToUse;
268  splitChanSuffix(group, name, { }, nameToUse, chanSelectToUse, skipDerived);
269  return obs_group_.vars.exists(fullVarName(group, nameToUse)) ||
270  (!skipDerived && obs_group_.vars.exists(fullVarName("Derived" + group, nameToUse)));
271 }
272 
273 // -----------------------------------------------------------------------------
274 ObsDtype ObsSpace::dtype(const std::string & group, const std::string & name,
275  bool skipDerived) const {
276  // For backward compatibility, recognize and handle appropriately variable names with
277  // channel suffixes.
278  std::string nameToUse;
279  std::vector<int> chanSelectToUse;
280  splitChanSuffix(group, name, { }, nameToUse, chanSelectToUse, skipDerived);
281 
282  std::string groupToUse = "Derived" + group;
283  if (skipDerived || !obs_group_.vars.exists(fullVarName(groupToUse, nameToUse)))
284  groupToUse = group;
285 
286  // Set the type to None if there is no type from the backend
287  ObsDtype VarType = ObsDtype::None;
288  if (has(groupToUse, nameToUse, skipDerived)) {
289  Variable var = obs_group_.vars.open(fullVarName(groupToUse, nameToUse));
290  if (var.isA<int>()) {
291  VarType = ObsDtype::Integer;
292  } else if (var.isA<float>()) {
293  VarType = ObsDtype::Float;
294  } else if (var.isA<std::string>()) {
295  if ((group == "MetaData") && (nameToUse == "datetime")) {
296  // TODO(srh) Workaround to cover when datetime was stored
297  // as a util::DateTime object. For now, ioda will store datetimes
298  // as strings and convert to DateTime objects for client access.
299  VarType = ObsDtype::DateTime;
300  } else {
301  VarType = ObsDtype::String;
302  }
303  }
304  }
305  return VarType;
306 }
307 
308 // -----------------------------------------------------------------------------
309 void ObsSpace::get_db(const std::string & group, const std::string & name,
310  std::vector<int> & vdata,
311  const std::vector<int> & chanSelect, bool skipDerived) const {
312  loadVar<int>(group, name, chanSelect, vdata, skipDerived);
313 }
314 
315 void ObsSpace::get_db(const std::string & group, const std::string & name,
316  std::vector<float> & vdata,
317  const std::vector<int> & chanSelect, bool skipDerived) const {
318  loadVar<float>(group, name, chanSelect, vdata, skipDerived);
319 }
320 
321 void ObsSpace::get_db(const std::string & group, const std::string & name,
322  std::vector<double> & vdata,
323  const std::vector<int> & chanSelect, bool skipDerived) const {
324  // load the float values from the database and convert to double
325  std::vector<float> floatData;
326  loadVar<float>(group, name, chanSelect, floatData, skipDerived);
327  ConvertVarType<float, double>(floatData, vdata);
328 }
329 
330 void ObsSpace::get_db(const std::string & group, const std::string & name,
331  std::vector<std::string> & vdata,
332  const std::vector<int> & chanSelect, bool skipDerived) const {
333  loadVar<std::string>(group, name, chanSelect, vdata, skipDerived);
334 }
335 
336 void ObsSpace::get_db(const std::string & group, const std::string & name,
337  std::vector<util::DateTime> & vdata,
338  const std::vector<int> & chanSelect, bool skipDerived) const {
339  std::vector<std::string> dtStrings;
340  loadVar<std::string>(group, name, chanSelect, dtStrings, skipDerived);
341  vdata = convertDtStringsToDtime(dtStrings);
342 }
343 
344 // -----------------------------------------------------------------------------
345 void ObsSpace::put_db(const std::string & group, const std::string & name,
346  const std::vector<int> & vdata,
347  const std::vector<std::string> & dimList) {
348  saveVar(group, name, vdata, dimList);
349 }
350 
351 void ObsSpace::put_db(const std::string & group, const std::string & name,
352  const std::vector<float> & vdata,
353  const std::vector<std::string> & dimList) {
354  saveVar(group, name, vdata, dimList);
355 }
356 
357 void ObsSpace::put_db(const std::string & group, const std::string & name,
358  const std::vector<double> & vdata,
359  const std::vector<std::string> & dimList) {
360  // convert to float, then save to the database
361  std::vector<float> floatData;
362  ConvertVarType<double, float>(vdata, floatData);
363  saveVar(group, name, floatData, dimList);
364 }
365 
366 void ObsSpace::put_db(const std::string & group, const std::string & name,
367  const std::vector<std::string> & vdata,
368  const std::vector<std::string> & dimList) {
369  saveVar(group, name, vdata, dimList);
370 }
371 
372 void ObsSpace::put_db(const std::string & group, const std::string & name,
373  const std::vector<util::DateTime> & vdata,
374  const std::vector<std::string> & dimList) {
375  std::vector<std::string> dtStrings(vdata.size(), "");
376  for (std::size_t i = 0; i < vdata.size(); ++i) {
377  dtStrings[i] = vdata[i].toString();
378  }
379  saveVar(group, name, dtStrings, dimList);
380 }
381 
382 // -----------------------------------------------------------------------------
383 const ObsSpace::RecIdxIter ObsSpace::recidx_begin() const {
384  return recidx_.begin();
385 }
386 
387 // -----------------------------------------------------------------------------
388 const ObsSpace::RecIdxIter ObsSpace::recidx_end() const {
389  return recidx_.end();
390 }
391 
392 // -----------------------------------------------------------------------------
393 bool ObsSpace::recidx_has(const std::size_t recNum) const {
394  RecIdxIter irec = recidx_.find(recNum);
395  return (irec != recidx_.end());
396 }
397 
398 // -----------------------------------------------------------------------------
399 std::size_t ObsSpace::recidx_recnum(const RecIdxIter & irec) const {
400  return irec->first;
401 }
402 
403 // -----------------------------------------------------------------------------
404 const std::vector<std::size_t> & ObsSpace::recidx_vector(const RecIdxIter & irec) const {
405  return irec->second;
406 }
407 
408 // -----------------------------------------------------------------------------
409 const std::vector<std::size_t> & ObsSpace::recidx_vector(const std::size_t recNum) const {
410  RecIdxIter Irec = recidx_.find(recNum);
411  if (Irec == recidx_.end()) {
412  std::string ErrMsg =
413  "ObsSpace::recidx_vector: Record number, " + std::to_string(recNum) +
414  ", does not exist in record index map.";
415  ABORT(ErrMsg);
416  }
417  return Irec->second;
418 }
419 
420 // -----------------------------------------------------------------------------
421 std::vector<std::size_t> ObsSpace::recidx_all_recnums() const {
422  std::vector<std::size_t> RecNums(nrecs_);
423  std::size_t recnum = 0;
424  for (RecIdxIter Irec = recidx_.begin(); Irec != recidx_.end(); ++Irec) {
425  RecNums[recnum] = Irec->first;
426  recnum++;
427  }
428  return RecNums;
429 }
430 
431 // ----------------------------- private functions -----------------------------
432 /*!
433  * \details This method provides a way to print an ObsSpace object in an output
434  * stream.
435  */
436 void ObsSpace::print(std::ostream & os) const {
437  std::size_t totalNlocs = this->globalNumLocs();
438  std::size_t nvars = this->obsvariables().size();
439  std::size_t nobs = totalNlocs * nvars;
440 
441  os << obsname() << ": nlocs: " << totalNlocs
442  << ", nvars: " << nvars << ", nobs: " << nobs;
443 }
444 
445 // -----------------------------------------------------------------------------
446 void ObsSpace::createObsGroupFromObsFrame(ObsFrameRead & obsFrame) {
447  // Determine the maximum frame size
448  Dimensions_t maxFrameSize = obs_params_.top_level_.obsIoInParameters().maxFrameSize;
449 
450  // Create the dimension specs for obs_group_
452  for (auto & dimNameObject : obsFrame.ioDimVarList()) {
453  std::string dimName = dimNameObject.first;
454  Variable srcDimVar = dimNameObject.second;
455  Dimensions_t dimSize = srcDimVar.getDimensions().dimsCur[0];
456  Dimensions_t maxDimSize = dimSize;
457  Dimensions_t chunkSize = dimSize;
458 
459  // If the dimension is nlocs, we want to avoid allocating the file's entire
460  // size because we could be taking a subset of the locations (MPI distribution,
461  // removal of obs outside the DA window).
462  //
463  // Make nlocs unlimited size, and start with its size limited by the
464  // max_frame_size parameter.
465  if (dimName == dim_info_.get_dim_name(ObsDimensionId::Nlocs)) {
466  if (dimSize > maxFrameSize) {
467  dimSize = maxFrameSize;
468  }
469  maxDimSize = Unlimited;
470  chunkSize = dimSize;
471  }
472 
473  if (srcDimVar.isA<int>()) {
474  newDims.push_back(ioda::NewDimensionScale<int>(
475  dimName, dimSize, maxDimSize, chunkSize));
476  } else if (srcDimVar.isA<float>()) {
477  newDims.push_back(ioda::NewDimensionScale<float>(
478  dimName, dimSize, maxDimSize, chunkSize));
479  }
480  }
481 
482  // Create the backend for obs_group_
483  Engines::BackendNames backendName = Engines::BackendNames::ObsStore; // Hdf5Mem; ObsStore;
485  // These parameters only matter if Hdf5Mem is the engine selected. ObsStore ignores.
488  backendParams.fileName = ioda::Engines::HH::genUniqueName();
489  backendParams.allocBytes = 1024*1024*50;
490  backendParams.flush = false;
491  Group backend = constructBackend(backendName, backendParams);
492 
493  // Create the ObsGroup and attach the backend.
495 
496  // fill in dimension coordinate values
497  for (auto & dimNameObject : obsFrame.ioDimVarList()) {
498  std::string dimName = dimNameObject.first;
499  Variable srcDimVar = dimNameObject.second;
500  Variable destDimVar = obs_group_.vars.open(dimName);
501 
502  // Set up the dimension selection objects. The prior loop declared the
503  // sizes of all the dimensions in the frame so use that as a guide, and
504  // transfer the first frame's worth of coordinate values accordingly.
505  std::vector<Dimensions_t> srcDimShape = srcDimVar.getDimensions().dimsCur;
506  std::vector<Dimensions_t> destDimShape = destDimVar.getDimensions().dimsCur;
507 
508  std::vector<Dimensions_t> counts = destDimShape;
509  std::vector<Dimensions_t> starts(counts.size(), 0);
510 
511  Selection srcSelect;
512  srcSelect.extent(srcDimShape).select({SelectionOperator::SET, starts, counts });
513  Selection memSelect;
514  memSelect.extent(destDimShape).select({SelectionOperator::SET, starts, counts });
515  Selection destSelect;
516  destSelect.extent(destDimShape).select({SelectionOperator::SET, starts, counts });
517 
518  if (srcDimVar.isA<int>()) {
519  std::vector<int> dimCoords;
520  srcDimVar.read<int>(dimCoords, memSelect, srcSelect);
521  destDimVar.write<int>(dimCoords, memSelect, destSelect);
522  } else if (srcDimVar.isA<float>()) {
523  std::vector<float> dimCoords;
524  srcDimVar.read<float>(dimCoords, memSelect, srcSelect);
525  destDimVar.write<float>(dimCoords, memSelect, destSelect);
526  }
527  }
528 }
529 
530 // -----------------------------------------------------------------------------
531 template<typename VarType>
532 bool ObsSpace::readObsSource(ObsFrameRead & obsFrame,
533  const std::string & varName, std::vector<VarType> & varValues) {
534  Variable sourceVar = obsFrame.vars().open(varName);
535 
536  // Read the variable
537  bool gotVarData = obsFrame.readFrameVar(varName, varValues);
538 
539  // Replace source fill values with corresponding missing marks
540  if ((gotVarData) && (sourceVar.hasFillValue())) {
541  VarType sourceFillValue;
542  detail::FillValueData_t sourceFvData = sourceVar.getFillValue();
543  sourceFillValue = detail::getFillValue<VarType>(sourceFvData);
544  VarType varFillValue = this->getFillValue<VarType>();
545  for (std::size_t i = 0; i < varValues.size(); ++i) {
546  if ((varValues[i] == sourceFillValue) || std::isinf(varValues[i])
547  || std::isnan(varValues[i])) {
548  varValues[i] = varFillValue;
549  }
550  }
551  }
552  return gotVarData;
553 }
554 
555 template<>
556 bool ObsSpace::readObsSource(ObsFrameRead & obsFrame,
557  const std::string & varName, std::vector<std::string> & varValues) {
558  Variable sourceVar = obsFrame.vars().open(varName);
559 
560  // Read the variable
561  bool gotVarData = obsFrame.readFrameVar(varName, varValues);
562 
563  // Replace source fill values with corresponding missing marks
564  if ((gotVarData) && (sourceVar.hasFillValue())) {
565  std::string sourceFillValue;
566  detail::FillValueData_t sourceFvData = sourceVar.getFillValue();
567  sourceFillValue = detail::getFillValue<std::string>(sourceFvData);
568  std::string varFillValue = this->getFillValue<std::string>();
569  for (std::size_t i = 0; i < varValues.size(); ++i) {
570  if (varValues[i] == sourceFillValue) {
571  varValues[i] = varFillValue;
572  }
573  }
574  }
575  return gotVarData;
576 }
577 
578 // -----------------------------------------------------------------------------
579 void ObsSpace::initFromObsSource(ObsFrameRead & obsFrame) {
580  // Walk through the frames and copy the data to the obs_group_ storage
581  dims_attached_to_vars_ = obsFrame.ioVarDimMap();
582 
583  // Create variables in obs_group_ based on those in the obs source
585 
587  int iframe = 1;
588  for (obsFrame.frameInit(); obsFrame.frameAvailable(); obsFrame.frameNext()) {
589  Dimensions_t frameStart = obsFrame.frameStart();
590 
591  // Resize the nlocs dimesion according to the adjusted frame size produced
592  // genFrameIndexRecNums. The second argument is to tell resizeNlocs whether
593  // to append or reset to the size given by the first arguemnt.
594  resizeNlocs(obsFrame.adjNlocsFrameCount(), (iframe > 1));
595 
596  // Clear out the selection caches
597  known_fe_selections_.clear();
598  known_be_selections_.clear();
599 
600  for (auto & varNameObject : obsFrame.ioVarList()) {
601  std::string varName = varNameObject.first;
602  Variable var = varNameObject.second;
603  Dimensions_t beFrameStart;
604  if (obsFrame.ioIsVarDimByNlocs(varName)) {
605  beFrameStart = obsFrame.adjNlocsFrameStart();
606  } else {
607  beFrameStart = frameStart;
608  }
609  Dimensions_t frameCount = obsFrame.frameCount(varName);
610 
611  // Transfer the variable to the in-memory storage
612  if (var.isA<int>()) {
613  std::vector<int> varValues;
614  if (readObsSource<int>(obsFrame, varName, varValues)) {
615  storeVar<int>(varName, varValues, beFrameStart, frameCount);
616  }
617  } else if (var.isA<float>()) {
618  std::vector<float> varValues;
619  if (readObsSource<float>(obsFrame, varName, varValues)) {
620  storeVar<float>(varName, varValues, beFrameStart, frameCount);
621  }
622  } else if (var.isA<std::string>()) {
623  std::vector<std::string> varValues;
624  if (readObsSource<std::string>(obsFrame, varName, varValues)) {
625  storeVar<std::string>(varName, varValues, beFrameStart, frameCount);
626  }
627  }
628  }
629  iframe++;
630  }
631 
632  // Record locations and channels dimension sizes
633  // The HDF library has an issue when a dimension marked UNLIMITED is queried for its
634  // size a zero is returned instead of the proper current size. As a workaround for this
635  // ask the frame how many locations it kept instead of asking the nlocs dimension for
636  // its size.
637  std::string nlocsName = dim_info_.get_dim_name(ObsDimensionId::Nlocs);
638  std::size_t nLocs = obsFrame.frameNumLocs();
640 
641  std::string nchansName = dim_info_.get_dim_name(ObsDimensionId::Nchans);
642  if (obs_group_.vars.exists(nchansName)) {
643  std::size_t nChans = obs_group_.vars.open(nchansName).getDimensions().dimsCur[0];
645  }
646 
647  // Record record information
648  nrecs_ = obsFrame.frameNumRecs();
649  indx_ = obsFrame.index();
650  recnums_ = obsFrame.recnums();
651 
652  // TODO(SRH) Eliminate this temporary fix. Some files do not have ISO 8601 date time
653  // strings. Instead they have a reference date time and time offset. If there is no
654  // datetime variable in the obs_group_ after reading in the file, then create one
655  // from the reference/offset time values.
656  std::string dtVarName = fullVarName("MetaData", "datetime");
657  if (!obs_group_.vars.exists(dtVarName)) {
658  int refDtime;
659  obsFrame.atts().open("date_time").read<int>(refDtime);
660 
661  std::vector<float> timeOffset;
662  Variable timeVar = obs_group_.vars.open(fullVarName("MetaData", "time"));
663  timeVar.read<float>(timeOffset);
664 
665  std::vector<util::DateTime> dtVals = convertRefOffsetToDtime(refDtime, timeOffset);
666  std::vector<std::string> dtStrings(dtVals.size(), "");
667  for (std::size_t i = 0; i < dtVals.size(); ++i) {
668  dtStrings[i] = dtVals[i].toString();
669  }
670 
672  params.chunk = true;
673  params.compressWithGZIP();
674  params.setFillValue<std::string>(this->getFillValue<std::string>());
675  std::vector<Variable>
678  .createWithScales<std::string>(dtVarName, dimVars, params)
679  .write<std::string>(dtStrings);
680  }
681 }
682 
683 // -----------------------------------------------------------------------------
684 void ObsSpace::resizeNlocs(const Dimensions_t nlocsSize, const bool append) {
686  Dimensions_t nlocsResize;
687  if (append) {
688  nlocsResize = nlocsVar.getDimensions().dimsCur[0] + nlocsSize;
689  } else {
690  nlocsResize = nlocsSize;
691  }
693  { std::pair<Variable, Dimensions_t>(nlocsVar, nlocsResize) });
694 }
695 
696 // -----------------------------------------------------------------------------
697 
698 template<typename VarType>
699 void ObsSpace::loadVar(const std::string & group, const std::string & name,
700  const std::vector<int> & chanSelect,
701  std::vector<VarType> & varValues,
702  bool skipDerived) const {
703  // For backward compatibility, recognize and handle appropriately variable names with
704  // channel suffixes.
705  std::string nameToUse;
706  std::vector<int> chanSelectToUse;
707  splitChanSuffix(group, name, chanSelect, nameToUse, chanSelectToUse);
708 
709  // Prefer variables from Derived* groups.
710  std::string groupToUse = "Derived" + group;
711  if (skipDerived || !obs_group_.vars.exists(fullVarName(groupToUse, nameToUse)))
712  groupToUse = group;
713 
714  // Try to open the variable.
715  ioda::Variable var = obs_group_.vars.open(fullVarName(groupToUse, nameToUse));
716 
717  std::string nchansVarName = this->get_dim_name(ObsDimensionId::Nchans);
718 
719  // In the following code, assume that if a variable has channels, the
720  // nchans dimension will be the second dimension.
721  if (obs_group_.vars.exists(nchansVarName)) {
722  Variable nchansVar = obs_group_.vars.open(nchansVarName);
723  if (var.getDimensions().dimensionality > 1) {
724  if (var.isDimensionScaleAttached(1, nchansVar) && (chanSelectToUse.size() > 0)) {
725  // This variable has nchans as the second dimension, and channel
726  // selection has been specified. Build selection objects based on the
727  // channel numbers. For now, select all locations (first dimension).
728  const std::size_t nchansDimIndex = 1;
729  Selection memSelect;
730  Selection obsGroupSelect;
731  const std::size_t numElements = createChannelSelections(
732  var, nchansDimIndex, chanSelectToUse, memSelect, obsGroupSelect);
733 
734  var.read<VarType>(varValues, memSelect, obsGroupSelect);
735  varValues.resize(numElements);
736  } else {
737  // Not a radiance variable, just read in the whole variable
738  var.read<VarType>(varValues);
739  }
740  } else {
741  // Not a radiance variable, just read in the whole variable
742  var.read<VarType>(varValues);
743  }
744  } else {
745  // Not a radiance variable, just read in the whole variable
746  var.read<VarType>(varValues);
747  }
748 }
749 
750 // -----------------------------------------------------------------------------
751 
752 template<typename VarType>
753 void ObsSpace::saveVar(const std::string & group, std::string name,
754  const std::vector<VarType> & varValues,
755  const std::vector<std::string> & dimList) {
756  // For backward compatibility, recognize and handle appropriately variable names with
757  // channel suffixes.
758 
759  std::vector<int> channels;
760 
761  const std::string nchansVarName = this->get_dim_name(ObsDimensionId::Nchans);
762  if (group != "MetaData" && obs_group_.vars.exists(nchansVarName)) {
763  // If the variable does not already exist and its name ends with an underscore followed by
764  // a number, interpret the latter as a channel number selecting a slice of the "nchans"
765  // dimension.
766  std::string nameToUse;
767  splitChanSuffix(group, name, {}, nameToUse, channels);
768  name = std::move(nameToUse);
769  }
770 
771  const std::string fullName = fullVarName(group, name);
772 
773  std::vector<std::string> dimListToUse = dimList;
774  if (!obs_group_.vars.exists(fullName) && !channels.empty()) {
775  // Append "channels" to the dimensions list if not already present.
776  const size_t nchansDimIndex =
777  std::find(dimListToUse.begin(), dimListToUse.end(), nchansVarName) -
778  dimListToUse.begin();
779  if (nchansDimIndex == dimListToUse.size())
780  dimListToUse.push_back(nchansVarName);
781  }
782  Variable var = openCreateVar<VarType>(fullName, dimListToUse);
783 
784  if (channels.empty()) {
785  var.write<VarType>(varValues);
786  } else {
787  // Find the index of the nchans dimension
788  Variable nchansVar = obs_group_.vars.open(nchansVarName);
789  std::vector<std::vector<Named_Variable>> dimScales =
790  var.getDimensionScaleMappings({Named_Variable(nchansVarName, nchansVar)});
791  size_t nchansDimIndex = std::find_if(dimScales.begin(), dimScales.end(),
792  [](const std::vector<Named_Variable> &x)
793  { return !x.empty(); }) - dimScales.begin();
794  if (nchansDimIndex == dimScales.size())
795  throw eckit::UserError("Variable " + fullName +
796  " is not indexed by channel numbers", Here());
797 
798  Selection memSelect;
799  Selection obsGroupSelect;
800  createChannelSelections(var, nchansDimIndex, channels,
801  memSelect, obsGroupSelect);
802  var.write<VarType>(varValues, memSelect, obsGroupSelect);
803  }
804 }
805 
806 // -----------------------------------------------------------------------------
807 
808 std::size_t ObsSpace::createChannelSelections(const Variable & variable,
809  std::size_t nchansDimIndex,
810  const std::vector<int> & channels,
811  Selection & memSelect,
812  Selection & obsGroupSelect) const {
813  // Create a vector with the channel indices corresponding to
814  // the channel numbers that have been requested.
815  std::vector<Dimensions_t> chanIndices;
816  chanIndices.reserve(channels.size());
817  for (std::size_t i = 0; i < channels.size(); ++i) {
818  auto ichan = chan_num_to_index_.find(channels[i]);
819  if (ichan != chan_num_to_index_.end()) {
820  chanIndices.push_back(ichan->second);
821  } else {
822  throw eckit::BadParameter("Selected channel number " +
823  std::to_string(channels[i]) + " does not exist.", Here());
824  }
825  }
826 
827  // Form index style selection for selecting channels
828  std::vector<Dimensions_t> varDims = variable.getDimensions().dimsCur;
829  std::vector<std::vector<Dimensions_t>> dimSelects(varDims.size());
830  Dimensions_t numElements = 1;
831  for (std::size_t i = 0; i < varDims.size(); ++i) {
832  if (i == nchansDimIndex) {
833  // channels are the second dimension
834  numElements *= chanIndices.size();
835  dimSelects[i] = chanIndices;
836  } else {
837  numElements *= varDims[i];
838  std::vector<Dimensions_t> allIndices(varDims[i]);
839  std::iota(allIndices.begin(), allIndices.end(), 0);
840  dimSelects[i] = allIndices;
841  }
842  }
843 
844  std::vector<Dimensions_t> memStarts(1, 0);
845  std::vector<Dimensions_t> memCounts(1, numElements);
846  memSelect.extent(memCounts)
847  .select({SelectionOperator::SET, memStarts, memCounts});
848 
849  // If numElements is zero, can't use the dimension selection style for
850  // the ObsStore backend. In this case use a hyperslab style selection with
851  // zero counts along each dimension which will produce the desired effect
852  // (of the selection specifying zero elements).
853  if (numElements == 0) {
854  // hyperslab style selection
855  std::vector<Dimensions_t> obsGroupStarts(varDims.size(), 0);
856  std::vector<Dimensions_t> obsGroupCounts(varDims.size(), 0);
857  obsGroupSelect.extent(varDims)
858  .select({SelectionOperator::SET, obsGroupStarts, obsGroupCounts});
859  } else {
860  // dimension style selection
861  obsGroupSelect.extent(varDims)
862  .select({SelectionOperator::SET, 0, dimSelects[0]});
863  for (std::size_t i = 1; i < dimSelects.size(); ++i) {
864  obsGroupSelect.select({SelectionOperator::AND, i, dimSelects[i]});
865  }
866  }
867 
868  return numElements;
869 }
870 
871 // -----------------------------------------------------------------------------
872 // This function is for transferring data from a memory buffer into the ObsSpace
873 // container. At this point, the time window filtering, obs grouping and MPI
874 // distribution has been applied to the input memory buffer (varValues). Also,
875 // the variable has been resized according to appending a new frame's worth of
876 // data to the existing variable in the ObsSpace container.
877 //
878 // What this means is that you can always transfer the data as a single contiguous
879 // block which can be accomplished with a single hyperslab selection. There should
880 // be no need to cache these selections because of this.
881 template<typename VarType>
882 void ObsSpace::storeVar(const std::string & varName, std::vector<VarType> & varValues,
883  const Dimensions_t frameStart, const Dimensions_t frameCount) {
884  // get the dimensions of the variable
885  Variable var = obs_group_.vars.open(varName);
886  std::vector<Dimensions_t> varDims = var.getDimensions().dimsCur;
887 
888  // check the caches for the selectors
889  std::vector<std::string> &dims = dims_attached_to_vars_.at(varName);
890  if (!known_fe_selections_.count(dims)) {
891  // backend starts at frameStart, and the count for the first dimension
892  // is the frame count
893  std::vector<Dimensions_t> beCounts = varDims;
894  beCounts[0] = frameCount;
895  std::vector<Dimensions_t> beStarts(beCounts.size(), 0);
896  beStarts[0] = frameStart;
897 
898  // front end always starts at zero, and the number of elements is equal to the
899  // product of the var dimensions (with the first dimension adjusted by
900  // the frame count)
901  std::vector<Dimensions_t> feCounts(1, std::accumulate(
902  beCounts.begin(), beCounts.end(), static_cast<Dimensions_t>(1),
903  std::multiplies<Dimensions_t>()));
904  std::vector<Dimensions_t> feStarts(1, 0);
905 
907  .extent(feCounts).select({ SelectionOperator::SET, feStarts, feCounts });
909  .extent(varDims).select({ SelectionOperator::SET, beStarts, beCounts });
910  }
911  Selection & feSelect = known_fe_selections_[dims];
912  Selection & beSelect = known_be_selections_[dims];
913 
914  var.write<VarType>(varValues, feSelect, beSelect);
915 }
916 
917 // -----------------------------------------------------------------------------
918 // NOTE(RH): Variable creation params rewritten so they are constructed once for each type.
919 // There is no need to keep re-creating the same objects over and over again.
920 // TODO(?): Rewrite slightly so that the scales are opened all at once and are kept
921 // open until the end of the function.
922 // TODO(?): Batch variable creation so that the collective function is used.
923 void ObsSpace::createVariables(const Has_Variables & srcVarContainer,
924  Has_Variables & destVarContainer,
925  const VarDimMap & dimsAttachedToVars) {
926  // Set up reusable creation parameters for the loop below. Use the JEDI missing
927  // values for the fill values.
928  VariableCreationParameters paramsInt = VariableCreationParameters::defaults<int>();
929  VariableCreationParameters paramsFloat = VariableCreationParameters::defaults<float>();
930  VariableCreationParameters paramsStr = VariableCreationParameters::defaults<std::string>();
931 
932  paramsInt.setFillValue<int>(this->getFillValue<int>());
933  paramsFloat.setFillValue<float>(this->getFillValue<float>());
934  paramsStr.setFillValue<std::string>(this->getFillValue<std::string>());
935 
936  // Walk through map to get list of variables to create along with
937  // their dimensions. Use the srcVarContainer to get the var data type.
938  for (auto & ivar : dimsAttachedToVars) {
939  std::string varName = ivar.first;
940  std::vector<std::string> varDimNames = ivar.second;
941 
942  // Create a vector with dimension scale vector from destination container
943  std::vector<Variable> varDims;
944  for (auto & dimVarName : varDimNames) {
945  varDims.push_back(destVarContainer.open(dimVarName));
946  }
947 
948  Variable srcVar = srcVarContainer.open(varName);
949  if (srcVar.isA<int>()) {
950  destVarContainer.createWithScales<int>(varName, varDims, paramsInt);
951  } else if (srcVar.isA<float>()) {
952  destVarContainer.createWithScales<float>(varName, varDims, paramsFloat);
953  } else if (srcVar.isA<std::string>()) {
954  destVarContainer.createWithScales<std::string>(varName, varDims, paramsStr);
955  } else {
956  if (this->comm().rank() == 0) {
957  oops::Log::warning() << "WARNING: ObsSpace::createVariables: "
958  << "Skipping variable due to an unexpected data type for variable: "
959  << varName << std::endl;
960  }
961  }
962  }
963 }
964 
965 // -----------------------------------------------------------------------------
966 void ObsSpace::fillChanNumToIndexMap() {
967  // If there is a channels dimension, load up the channel number to index map
968  // for channel selection feature.
969  std::string nchansVarName = this->get_dim_name(ObsDimensionId::Nchans);
970  if (obs_group_.vars.exists(nchansVarName)) {
971  // Get the vector of channel numbers
972  Variable nchansVar = obs_group_.vars.open(nchansVarName);
973  std::vector<int> chanNumbers;
974  if (nchansVar.isA<int>()) {
975  nchansVar.read<int>(chanNumbers);
976  } else if (nchansVar.isA<float>()) {
977  std::vector<float> floatChanNumbers;
978  nchansVar.read<float>(floatChanNumbers);
979  ConvertVarType<float, int>(floatChanNumbers, chanNumbers);
980  }
981 
982  // Walk through the vector and place the number to index mapping into
983  // the map structure.
984  for (int i = 0; i < chanNumbers.size(); ++i) {
985  chan_num_to_index_[chanNumbers[i]] = i;
986  }
987  }
988 }
989 
990 // -----------------------------------------------------------------------------
991 void ObsSpace::splitChanSuffix(const std::string & group, const std::string & name,
992  const std::vector<int> & chanSelect, std::string & nameToUse,
993  std::vector<int> & chanSelectToUse,
994  bool skipDerived) const {
995  nameToUse = name;
996  chanSelectToUse = chanSelect;
997  // For backward compatibility, recognize and handle appropriately variable names with
998  // channel suffixes.
999  if (chanSelect.empty() &&
1000  !obs_group_.vars.exists(fullVarName(group, name)) &&
1001  (skipDerived || !obs_group_.vars.exists(fullVarName("Derived" + group, name)))) {
1002  int channelNumber;
1003  if (extractChannelSuffixIfPresent(name, nameToUse, channelNumber))
1004  chanSelectToUse = {channelNumber};
1005  }
1006 }
1007 
1008 // -----------------------------------------------------------------------------
1009 void ObsSpace::buildSortedObsGroups() {
1010  typedef std::map<std::size_t, std::vector<std::pair<float, std::size_t>>> TmpRecIdxMap;
1011  typedef TmpRecIdxMap::iterator TmpRecIdxIter;
1012 
1013  // Get the sort variable from the data store, and convert to a vector of floats.
1014  std::size_t nLocs = this->nlocs();
1015  std::vector<float> SortValues(nLocs);
1016  if (this->obs_sort_var() == "datetime") {
1017  std::vector<util::DateTime> Dates(nLocs);
1018  get_db("MetaData", this->obs_sort_var(), Dates);
1019  for (std::size_t iloc = 0; iloc < nLocs; iloc++) {
1020  SortValues[iloc] = (Dates[iloc] - Dates[0]).toSeconds();
1021  }
1022  } else {
1023  get_db("MetaData", this->obs_sort_var(), SortValues);
1024  }
1025 
1026  // Construct a temporary structure to do the sorting, then transfer the results
1027  // to the data member recidx_.
1028  TmpRecIdxMap TmpRecIdx;
1029  for (size_t iloc = 0; iloc < nLocs; iloc++) {
1030  TmpRecIdx[recnums_[iloc]].push_back(std::make_pair(SortValues[iloc], iloc));
1031  }
1032 
1033  for (TmpRecIdxIter irec = TmpRecIdx.begin(); irec != TmpRecIdx.end(); ++irec) {
1034  if (this->obs_sort_order() == "ascending") {
1035  sort(irec->second.begin(), irec->second.end());
1036  } else {
1037  // Use a lambda function to access the std::pair greater-than operator to
1038  // implement a descending order sort, ensuring the associated indices remain
1039  // in ascending order.
1040  sort(irec->second.begin(), irec->second.end(),
1041  [](const std::pair<float, std::size_t> & p1,
1042  const std::pair<float, std::size_t> & p2){
1043  return (p2.first < p1.first ||
1044  (!(p1.first < p2.first) && p2.second > p1.second));});
1045  }
1046  }
1047 
1048  // Copy indexing to the recidx_ data member.
1049  for (TmpRecIdxIter irec = TmpRecIdx.begin(); irec != TmpRecIdx.end(); ++irec) {
1050  recidx_[irec->first].resize(irec->second.size());
1051  for (std::size_t iloc = 0; iloc < irec->second.size(); iloc++) {
1052  recidx_[irec->first][iloc] = irec->second[iloc].second;
1053  }
1054  }
1055 }
1056 
1057 // -----------------------------------------------------------------------------
1058 void ObsSpace::buildRecIdxUnsorted() {
1059  std::size_t nLocs = this->nlocs();
1060  for (size_t iloc = 0; iloc < nLocs; iloc++) {
1061  recidx_[recnums_[iloc]].push_back(iloc);
1062  }
1063 }
1064 
1065 // -----------------------------------------------------------------------------
1066 void ObsSpace::saveToFile() {
1067  // Form lists of regular and dimension scale variables
1068  VarNameObjectList varList;
1069  VarNameObjectList dimVarList;
1070  VarDimMap dimsAttachedToVars;
1071  Dimensions_t maxVarSize;
1072  collectVarDimInfo(obs_group_, varList, dimVarList, dimsAttachedToVars, maxVarSize);
1073 
1074  // Record dimension scale variables for the output file creation.
1075  for (auto & dimNameObject : dimVarList) {
1076  std::string dimName = dimNameObject.first;
1077  Dimensions_t dimSize = dimNameObject.second.getDimensions().dimsCur[0];
1078  Dimensions_t dimMaxSize = dimSize;
1079  Dimensions_t dimChunkSize = dimSize;
1080  if (dimName == dim_info_.get_dim_name(ObsDimensionId::Nlocs)) {
1081  dimSize = this->nlocs();
1082  dimMaxSize = Unlimited;
1083  dimChunkSize = this->globalNumLocs();
1084  }
1085  // It's possible that dimChunkSize is set to zero which is an illegal value
1086  // for the chunk size. If the current dimension size is zero, then it's okay
1087  // to set chunk size to an arbitrary small size since you don't need to be
1088  // particularly efficient about it.
1089  if (dimChunkSize == 0) {
1090  dimChunkSize = 5;
1091  }
1092  obs_params_.setDimScale(dimName, dimSize, dimMaxSize, dimChunkSize);
1093  }
1094 
1095  // Record the maximum variable size
1096  obs_params_.setMaxVarSize(maxVarSize);
1097 
1098  // Open the file for output
1099  ObsFrameWrite obsFrame(obs_params_);
1100 
1101  // Iterate through the frames and variables moving data from the database into
1102  // the file.
1103  int iframe = 0;
1104  for (obsFrame.frameInit(varList, dimVarList, dimsAttachedToVars, maxVarSize);
1105  obsFrame.frameAvailable(); obsFrame.frameNext(varList)) {
1106  Dimensions_t frameStart = obsFrame.frameStart();
1107  for (auto & varNameObject : varList) {
1108  // form the destination (ObsFrame) variable name
1109  std::string destVarName = varNameObject.first;
1110 
1111  // open the destination variable and get the associated count
1112  Variable destVar = obsFrame.vars().open(destVarName);
1113  Dimensions_t frameCount = obsFrame.frameCount(destVarName);
1114 
1115  // transfer data if we haven't gone past the end of the variable yet
1116  if (frameCount > 0) {
1117  // Form the hyperslab selection for this frame
1118  Variable srcVar = varNameObject.second;
1119  std::vector<Dimensions_t> varShape = srcVar.getDimensions().dimsCur;
1120  ioda::Selection memSelect = obsFrame.createMemSelection(varShape, frameCount);
1121  ioda::Selection varSelect =
1122  obsFrame.createVarSelection(varShape, frameStart, frameCount);
1123 
1124  // transfer the data
1125  if (srcVar.isA<int>()) {
1126  std::vector<int> varValues;
1127  srcVar.read<int>(varValues, memSelect, varSelect);
1128  obsFrame.writeFrameVar(destVarName, varValues);
1129  } else if (srcVar.isA<float>()) {
1130  std::vector<float> varValues;
1131  srcVar.read<float>(varValues, memSelect, varSelect);
1132  obsFrame.writeFrameVar(destVarName, varValues);
1133  } else if (srcVar.isA<std::string>()) {
1134  std::vector<std::string> varValues;
1135  srcVar.read<std::string>(varValues, memSelect, varSelect);
1136  obsFrame.writeFrameVar(destVarName, varValues);
1137  }
1138  }
1139  }
1140  }
1141 }
1142 
1143 // -----------------------------------------------------------------------------
1144 template <typename DataType>
1145 void ObsSpace::extendVariable(Variable & extendVar,
1146  const size_t upperBoundOnGlobalNumOriginalRecs) {
1147  const DataType missing = util::missingValue(missing);
1148 
1149  // Read in variable data values. At this point the values will contain
1150  // the extended region filled with missing values. The read call will size
1151  // the varVals vector accordingly.
1152  std::vector<DataType> varVals;
1153  extendVar.read<DataType>(varVals);
1154 
1155  for (const auto & recordindex : recidx_) {
1156  // Only deal with records in the original ObsSpace.
1157  if (recordindex.first >= upperBoundOnGlobalNumOriginalRecs) break;
1158 
1159  // Find the first non-missing value in the original record.
1160  DataType fillValue = missing;
1161  for (const auto & jloc : recordindex.second) {
1162  if (varVals[jloc] != missing) {
1163  fillValue = varVals[jloc];
1164  break;
1165  }
1166  }
1167 
1168  // Fill the averaged record with the first non-missing value in the original record.
1169  // (If all values are missing, do nothing.)
1170  if (fillValue != missing) {
1171  for (const auto & jloc : recidx_[recordindex.first + upperBoundOnGlobalNumOriginalRecs]) {
1172  varVals[jloc] = fillValue;
1173  }
1174  }
1175  }
1176 
1177  // Write out values of the averaged record.
1178  extendVar.write<DataType>(varVals);
1179 }
1180 
1181 // -----------------------------------------------------------------------------
1182 void ObsSpace::extendObsSpace(const ObsExtendParameters & params) {
1183  // In this function we use the following terminology:
1184  // * The word 'original' refers to locations and records present in the ObsSpace before its
1185  // extension.
1186  // * The word 'averaged' refers to locations and records created when extending the ObsSpace
1187  // (they will represent data averaged onto model levels).
1188  // * The word 'extended' refers to the original and averaged locations and records taken
1189  // together.
1190  // * The word 'local` refers to locations and records held on the current process.
1191  // * The word 'global` refers to locations and records held on any process.
1192 
1193  const int nlevs = params.numModelLevels;
1194 
1195  const size_t numOriginalLocs = this->nlocs();
1196  const bool recordsExist = !this->obs_group_vars().empty();
1197  if (nlevs > 0 &&
1198  gnlocs_ > 0 &&
1199  recordsExist) {
1200  // Identify the indices of all local original records.
1201  const std::set<size_t> uniqueOriginalRecs(recnums_.begin(), recnums_.end());
1202 
1203  // Find the largest global indices of locations and records in the original ObsSpace.
1204  // Increment them by one to produce the initial values for the global indices of locations
1205  // and records in the averaged ObsSpace.
1206 
1207  // These are *upper bounds* on the global numbers of original locations and records
1208  // because the sequences of global location indices and records may contain gaps.
1209  size_t upperBoundOnGlobalNumOriginalLocs = 0;
1210  size_t upperBoundOnGlobalNumOriginalRecs = 0;
1211  if (numOriginalLocs > 0) {
1212  upperBoundOnGlobalNumOriginalLocs = indx_.back() + 1;
1213  upperBoundOnGlobalNumOriginalRecs = *uniqueOriginalRecs.rbegin() + 1;
1214  }
1215  dist_->max(upperBoundOnGlobalNumOriginalLocs);
1216  dist_->max(upperBoundOnGlobalNumOriginalRecs);
1217 
1218  // The replica distribution will be used to place each averaged record on the same process
1219  // as the corresponding original record.
1220  std::shared_ptr<Distribution> replicaDist = createReplicaDistribution(
1221  commMPI_, dist_, recnums_);
1222 
1223  // Create averaged locations and records.
1224 
1225  // Local index of an averaged location. Note that these indices, like local indices of
1226  // original locations, start from 0.
1227  size_t averagedLoc = 0;
1228  for (size_t originalRec : uniqueOriginalRecs) {
1229  ASSERT(dist_->isMyRecord(originalRec));
1230  const size_t averagedRec = originalRec;
1231  const size_t extendedRec = upperBoundOnGlobalNumOriginalRecs + averagedRec;
1232  nrecs_++;
1233  // recidx_ stores the locations belonging to each record on the local processor.
1234  std::vector<size_t> &locsInRecord = recidx_[extendedRec];
1235  for (int ilev = 0; ilev < nlevs; ++ilev, ++averagedLoc) {
1236  const size_t extendedLoc = numOriginalLocs + averagedLoc;
1237  const size_t globalAveragedLoc = originalRec * nlevs + ilev;
1238  const size_t globalExtendedLoc = upperBoundOnGlobalNumOriginalLocs + globalAveragedLoc;
1239  // Geographical position shouldn't matter -- the replica distribution is expected
1240  // to assign records to processors solely on the basis of their indices.
1241  replicaDist->assignRecord(averagedRec, globalAveragedLoc, eckit::geometry::Point2());
1242  ASSERT(replicaDist->isMyRecord(averagedRec));
1243  recnums_.push_back(extendedRec);
1244  indx_.push_back(globalExtendedLoc);
1245  locsInRecord.push_back(extendedLoc);
1246  }
1247  }
1248  replicaDist->computePatchLocs();
1249 
1250  const size_t numAveragedLocs = averagedLoc;
1251  const size_t numExtendedLocs = numOriginalLocs + numAveragedLocs;
1252 
1253  // Extend all existing vectors with missing values.
1254  // Only vectors with (at least) one dimension equal to nlocs are modified.
1255  // Second argument (bool) to resizeNlocs tells function:
1256  // true -> append the amount in first argument to the existing size
1257  // false -> reset the existing size to the amount in the first argument
1258  this->resizeNlocs(numExtendedLocs, false);
1259 
1260  // Extend all existing vectors with missing values, excepting those
1261  // that have been selected to be filled with non-missing values.
1262  // By default, some spatial and temporal coordinates are filled in this way.
1263  //
1264  // The resizeNlocs() call above has extended all variables with nlocs as a first
1265  // dimension to the new nlocsext size, and filled all the extended parts with
1266  // missing values. Go through the list of variables that are to be filled with
1267  // non-missing values, check if they exist and if so fill in the extended section
1268  // with non-missing values.
1269  const std::vector <std::string> &nonMissingExtendedVars = params.nonMissingExtendedVars;
1270  for (auto & varName : nonMissingExtendedVars) {
1271  // It is implied that these variables are in the MetaData group
1272  const std::string groupName = "MetaData";
1273  const std::string fullVname = fullVarName(groupName, varName);
1274  if (obs_group_.vars.exists(fullVname)) {
1275  // Note nlocs at this point holds the original size before extending.
1276  // The numOriginalLocs argument passed to extendVariable indicates where to start filling.
1277  Variable extendVar = obs_group_.vars.open(fullVname);
1278  if (extendVar.isA<int>()) {
1279  extendVariable<int>(extendVar, upperBoundOnGlobalNumOriginalRecs);
1280  } else if (extendVar.isA<float>()) {
1281  extendVariable<float>(extendVar, upperBoundOnGlobalNumOriginalRecs);
1282  } else if (extendVar.isA<std::string>()) {
1283  extendVariable<std::string>(extendVar, upperBoundOnGlobalNumOriginalRecs);
1284  }
1285  }
1286  }
1287 
1288  // Fill extended_obs_space with 0, which indicates the standard section of the ObsSpace,
1289  // and 1, which indicates the extended section.
1290  std::vector <int> extended_obs_space(numExtendedLocs, 0);
1291  std::fill(extended_obs_space.begin() + numOriginalLocs, extended_obs_space.end(), 1);
1292  // Save extended_obs_space for use in filters.
1293  put_db("MetaData", "extended_obs_space", extended_obs_space);
1294 
1295  // Calculate the number of newly created locations on all processes (counting those
1296  // held on multiple processes only once).
1297  std::unique_ptr<Accumulator<size_t>> accumulator = replicaDist->createAccumulator<size_t>();
1298  for (size_t averagedLoc = 0; averagedLoc < numAveragedLocs; ++averagedLoc)
1299  accumulator->addTerm(averagedLoc, 1);
1300  size_t globalNumAveragedLocs = accumulator->computeResult();
1301 
1302  // Replace the original distribution with a PairOfDistributions, covering
1303  // both the original and averaged locations.
1304  dist_ = std::make_shared<PairOfDistributions>(commMPI_, dist_, replicaDist,
1305  numOriginalLocs,
1306  upperBoundOnGlobalNumOriginalRecs);
1307 
1308  // Increment nlocs on this processor.
1309  dim_info_.set_dim_size(ObsDimensionId::Nlocs, numExtendedLocs);
1310  // Increment gnlocs_.
1311  gnlocs_ += globalNumAveragedLocs;
1312  }
1313 }
1314 
1315 // -----------------------------------------------------------------------------
1316 void ObsSpace::createMissingObsErrors() {
1317  std::vector<float> obserror; // Will be initialized only if necessary
1318 
1319  for (size_t i = 0; i < obsvars_.size(); ++i) {
1320  if (!has("ObsError", obsvars_[i])) {
1321  if (obserror.empty())
1322  obserror.assign(nlocs(), util::missingValue(float()));
1323  put_db("DerivedObsError", obsvars_[i], obserror);
1324  }
1325  }
1326 }
1327 // -----------------------------------------------------------------------------
1328 
1329 } // namespace ioda
HDF5 engine.
Interfaces for ioda::Variable and related classes.
Groups are a new implementation of ObsSpaces.
Definition: Group.h:159
This class exists inside of ioda::Group and provides the interface to manipulating Variables.
void set_dim_size(const ObsDimensionId dimId, std::size_t dimSize)
set the dimension size for the given dimension id
Definition: ObsSpace.cc:92
std::string get_dim_name(const ObsDimensionId dimId) const
return the dimension name for the given dimension id
Definition: ObsSpace.cc:84
ObsDimensionId get_dim_id(const std::string &dimName) const
return the standard id value for the given dimension name
Definition: ObsSpace.cc:80
std::map< ObsDimensionId, std::size_t > dim_id_size_
map going from dim id to dim size
Definition: src/ObsSpace.h:87
std::size_t get_dim_size(const ObsDimensionId dimId) const
return the dimension size for the given dimension id
Definition: ObsSpace.cc:88
std::map< std::string, ObsDimensionId > dim_name_id_
map going from dim name to id
Definition: src/ObsSpace.h:90
std::map< ObsDimensionId, std::string > dim_id_name_
map going from dim id to dim name
Definition: src/ObsSpace.h:84
bool ioIsVarDimByNlocs(const std::string &varName) const
return true if variable is dimensioned by nlocs
Definition: ObsFrame.h:76
Selection createMemSelection(const std::vector< Dimensions_t > &varShape, const Dimensions_t frameCount)
create selection object for accessing a memory buffer
Definition: ObsFrame.cc:26
virtual std::size_t frameNumLocs() const
return number of locations
Definition: ObsFrame.h:81
const VarNameObjectList & ioVarList() const
return list of regular variables from ObsIo
Definition: ObsFrame.h:64
VarDimMap ioVarDimMap() const
return map from variables to their attached dimension scales
Definition: ObsFrame.h:70
Dimensions_t globalNumLocs() const
return number of locations that were selected from ObsIo
Definition: ObsFrame.h:87
const VarNameObjectList & ioDimVarList() const
return list of dimension scale variables from ObsIo
Definition: ObsFrame.h:67
Selection createVarSelection(const std::vector< Dimensions_t > &varShape, const Dimensions_t frameStart, const Dimensions_t frameCount)
create selection object for accessing a frame from a whole variable
Definition: ObsFrame.cc:72
Has_Attributes & atts() const
return attributes container from ObsIo
Definition: ObsFrame.h:61
Dimensions_t globalNumLocsOutsideTimeWindow() const
return number of locations from obs source that were outside the time window
Definition: ObsFrame.h:90
Has_Variables & vars() const
return variables container from ObsIo
Definition: ObsFrame.h:58
virtual std::size_t frameNumRecs() const
return number of records
Definition: ObsFrame.h:84
Implementation of ObsFrameRead class.
std::vector< std::size_t > index() const override
return list of indices indicating which locations were selected from ObsIo
void frameNext() override
move to the next frame
Definition: ObsFrameRead.cc:75
Dimensions_t frameCount(const std::string &varName) override
return current frame count for variable
Dimensions_t adjNlocsFrameCount() const override
return adjusted nlocs frame count
bool frameAvailable() override
true if a frame is available (not past end of frames)
Definition: ObsFrameRead.cc:81
void frameInit() override
initialize for walking through the frames
Definition: ObsFrameRead.cc:50
bool readFrameVar(const std::string &varName, std::vector< int > &varData)
read a frame variable
Dimensions_t frameStart() override
return current frame starting index
Dimensions_t adjNlocsFrameStart() const override
return adjusted nlocs frame start
std::shared_ptr< const Distribution > distribution()
return the MPI distribution
std::vector< std::size_t > recnums() const override
return list of record numbers from ObsIo
Implementation of ObsFrameWrite class.
void writeFrameVar(const std::string &varName, const std::vector< int > &varData)
write a frame variable
void frameNext(const VarNameObjectList &varList) override
move to the next frame
Dimensions_t frameCount(const std::string &varName) override
return current frame count for variable
void frameInit(const VarNameObjectList &varList, const VarNameObjectList &dimVarList, const VarDimMap &varDimMap, const Dimensions_t maxVarSize) override
initialize for walking through the frames
bool frameAvailable() override
true if a frame is available (not past end of frames)
Dimensions_t frameStart() override
return current frame starting index
static ObsGroup generate(Group &emptyGroup, const NewDimensionScales_t &fundamentalDims, std::shared_ptr< const detail::DataLayoutPolicy > layout=nullptr)
Create an empty ObsGroup and populate it with the fundamental dimensions.
Definition: ObsGroup.cpp:72
void resize(const std::vector< std::pair< Variable, ioda::Dimensions_t >> &newDims)
Resize a Dimension and every Variable that depends on it.
Definition: ObsGroup.cpp:85
oops::Parameter< ObsGroupingParameters > obsGrouping
options controlling obs record grouping
oops::Parameter< int > maxFrameSize
maximum frame size
void extendObsSpace(const ObsExtendParameters &params)
Extend the ObsSpace according to the method requested in the configuration file.
Definition: ObsSpace.cc:1182
void createVariables(const Has_Variables &srcVarContainer, Has_Variables &destVarContainer, const VarDimMap &dimsAttachedToVars)
create set of variables from source variables and lists
Definition: ObsSpace.cc:923
void saveToFile()
Dump the database into the output file.
Definition: ObsSpace.cc:1066
const std::vector< std::size_t > & recnum() const
return reference to the record number vector
Definition: src/ObsSpace.h:223
void put_db(const std::string &group, const std::string &name, const std::vector< int > &vdata, const std::vector< std::string > &dimList={ "nlocs" })
transfer data from vdata to the obs container
std::shared_ptr< const Distribution > dist_
MPI distribution object.
Definition: src/ObsSpace.h:403
void get_db(const std::string &group, const std::string &name, std::vector< int > &vdata, const std::vector< int > &chanSelect={ }, bool skipDerived=false) const
transfer data from the obs container to vdata
std::size_t gnlocs_outside_timewindow_
number of nlocs from the obs source that are outside the time window
Definition: src/ObsSpace.h:378
void buildRecIdxUnsorted()
Create the recidx data structure with unsorted record groups.
Definition: ObsSpace.cc:1058
ObsDimInfo dim_info_
dimension information for variables in this obs space
Definition: src/ObsSpace.h:384
void splitChanSuffix(const std::string &group, const std::string &name, const std::vector< int > &chanSelect, std::string &nameToUse, std::vector< int > &chanSelectToUse, bool skipDerived=false) const
split off the channel number suffix from a given variable name
Definition: ObsSpace.cc:991
VarDimMap dims_attached_to_vars_
map showing association of dim names with each variable name
Definition: src/ObsSpace.h:418
bool has(const std::string &group, const std::string &name, bool skipDerived=false) const
return true if variable name exists in group group or (unless skipDerived is set to true) "Derived" +...
Definition: ObsSpace.cc:263
std::string get_dim_name(const ObsDimensionId dimId) const
return the standard dimension name for the given dimension id
Definition: src/ObsSpace.h:193
void createObsGroupFromObsFrame(ObsFrameRead &obsFrame)
Initialize the database from a source (ObsFrame ojbect)
Definition: ObsSpace.cc:446
std::string obsname_
name of obs space
Definition: src/ObsSpace.h:397
std::size_t nrecs_
number of records
Definition: src/ObsSpace.h:381
const std::vector< std::string > & obs_group_vars() const
return YAML configuration parameter: obsdatain.obsgrouping.group variables
Definition: ObsSpace.cc:243
oops::Variables obsvars_
Observation "variables" to be simulated.
Definition: src/ObsSpace.h:400
std::map< int, int > chan_num_to_index_
map to go from channel number (not necessarily consecutive) to channel index (consecutive,...
Definition: src/ObsSpace.h:388
void saveVar(const std::string &group, std::string name, const std::vector< VarType > &varValues, const std::vector< std::string > &dimList)
save a variable to the obs_group_ object
const eckit::mpi::Comm & comm() const
Definition: src/ObsSpace.h:149
void initFromObsSource(ObsFrameRead &obsFrame)
initialize the in-memory obs_group_ (ObsGroup) object from the ObsIo source
Definition: ObsSpace.cc:579
RecIdxMap::const_iterator RecIdxIter
Definition: src/ObsSpace.h:120
void createMissingObsErrors()
For each simulated variable that doesn't have an accompanying array in the ObsError or DerivedObsErro...
Definition: ObsSpace.cc:1316
RecIdxMap recidx_
profile ordering
Definition: src/ObsSpace.h:412
ObsSpaceParameters obs_params_
obs io parameters
Definition: src/ObsSpace.h:394
void buildSortedObsGroups()
Create the recidx data structure holding sorted record groups.
Definition: ObsSpace.cc:1009
ObsGroup obs_group_
observation data store
Definition: src/ObsSpace.h:391
std::vector< std::size_t > indx_
indexes of locations to extract from the input obs file
Definition: src/ObsSpace.h:406
void fillChanNumToIndexMap()
fill in the channel number to channel index map
Definition: ObsSpace.cc:966
std::string obs_sort_order() const
return YAML configuration parameter: obsdatain.obsgrouping.sort order
Definition: ObsSpace.cc:253
void resizeNlocs(const Dimensions_t nlocsSize, const bool append)
resize along nlocs dimension
Definition: ObsSpace.cc:684
std::size_t createChannelSelections(const Variable &variable, std::size_t nchansDimIndex, const std::vector< int > &channels, Selection &memSelect, Selection &obsGroupSelect) const
Create selections of slices of the variable variable along dimension nchansDimIndex corresponding to ...
Definition: ObsSpace.cc:808
bool recidx_is_sorted_
indicator whether the data in recidx_ is sorted
Definition: src/ObsSpace.h:415
std::size_t globalNumLocsOutsideTimeWindow() const
return number of locations from obs source that were outside the time window
Definition: src/ObsSpace.h:172
const eckit::mpi::Comm & commMPI_
MPI communicator.
Definition: src/ObsSpace.h:372
std::size_t globalNumLocs() const
return the total number of locations in the corresponding obs spaces across all MPI tasks
Definition: src/ObsSpace.h:169
std::size_t gnlocs_
total number of locations
Definition: src/ObsSpace.h:375
std::map< std::vector< std::string >, Selection > known_be_selections_
cache for backend selection
Definition: src/ObsSpace.h:424
const oops::Variables & obsvariables() const
return the collection of all simulated variables
Definition: src/ObsSpace.h:349
const std::string & obsname() const
return the name of the obs type being stored
Definition: src/ObsSpace.h:217
std::string obs_sort_var() const
return YAML configuration parameter: obsdatain.obsgrouping.sort variable
Definition: ObsSpace.cc:248
std::map< std::vector< std::string >, Selection > known_fe_selections_
cache for frontend selection
Definition: src/ObsSpace.h:421
std::vector< std::size_t > recnums_
record numbers associated with the location indexes
Definition: src/ObsSpace.h:409
void setMaxVarSize(const Dimensions_t maxVarSize)
set the maximum variable size
ObsTopLevelParameters top_level_
sub groups of parameters
void setDimScale(const std::string &dimName, const Dimensions_t curSize, const Dimensions_t maxSize, const Dimensions_t chunkSize)
set a new dimension scale
oops::RequiredParameter< oops::Variables > simVars
simulated variables
oops::OptionalParameter< ObsExtendParameters > obsExtend
extend the ObsSpace with extra fixed-size records
oops::RequiredParameter< std::string > obsSpaceName
name of obs space
oops::Parameter< bool > saveObsDistribution
oops::OptionalParameter< ObsFileOutParameters > obsOutFile
output specification by writing to a file
oops::Parameter< oops::Variables > derivedSimVars
oops::Parameter< std::string > distName
name of MPI distribution
const ObsIoParametersBase & obsIoInParameters() const
parameters indicating where to load data from
A Selection represents the bounds of the data, in ioda or in userspace, that you are reading or writi...
Definition: Selection.h:48
Variables store data!
Definition: Variable.h:680
virtual Attribute_Implementation read(gsl::span< char > data, const Type &in_memory_dataType) const
The fundamental read function. Backends overload this function to implement all read operations.
Definition: Attribute.cpp:75
virtual Group open(const std::string &name) const
Open a group.
Definition: Group.cpp:87
Has_Variables vars
Use this to access variables.
Definition: Group.h:123
virtual bool exists(const std::string &name) const
Definition: Group.cpp:65
virtual Attribute open(const std::string &name) const
Open an Attribute by name.
Variable createWithScales(const std::string &name, const std::vector< Variable > &dimension_scales, const VariableCreationParameters &params=VariableCreationParameters::defaulted< DataType >())
Convenience function to create a Variable from certain dimension scales.
virtual Variable open(const std::string &name) const
Open a Variable by name.
virtual std::vector< std::string > list() const
virtual bool exists(const std::string &name) const
Does a Variable with the specified name exist?
virtual FillValueData_t getFillValue() const
Retrieve the fill value.
Definition: Variable.cpp:111
bool isA() const
Convenience function to check a Variable's storage type.
Definition: Variable.h:99
virtual bool isDimensionScaleAttached(unsigned int DimensionNumber, const Variable &scale) const
Is a dimension scale attached to this Variable in a certain position?
Definition: Variable.cpp:288
virtual bool hasFillValue() const
Check if a variable has a fill value set.
Definition: Variable.cpp:98
virtual Dimensions getDimensions() const
Definition: Variable.cpp:160
virtual std::vector< std::vector< Named_Variable > > getDimensionScaleMappings(const std::list< Named_Variable > &scalesToQueryAgainst, bool firstOnly=true) const
Which dimensions are attached at which positions? This function may offer improved performance on som...
Definition: Variable.cpp:303
virtual Variable read(gsl::span< char > data, const Type &in_memory_dataType, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Read the Variable - as char array. Ordering is row-major.
Definition: Variable.cpp:330
virtual Variable write(gsl::span< char > data, const Type &in_memory_dataType, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all)
The fundamental write function. Backends overload this function to implement all write operations.
Definition: Variable.cpp:317
virtual Variable resize(const std::vector< Dimensions_t > &newDims)
Resize the variable.
Definition: Variable.cpp:172
IODA_DL std::string genUniqueName()
Convenience function to generate a random file name.
Definition: HH.cpp:50
BackendNames
Backend names.
Definition: Factory.h:28
IODA_DL Group constructBackend(BackendNames name, BackendCreationParameters &params)
This is a simple factory style function that will instantiate a different backend based on a given na...
Definition: Factory.cpp:124
@ ObsStore
ObsStore in-memory.
@ Truncate_If_Exists
If the file already exists, overwrite it.
Selection & extent(const VecDimensions_t &sz)
Provide the dimensions of the object that you are selecting from.
Definition: Selection.h:111
Selection & select(const SingleSelection &s)
Append a new selection.
Definition: Selection.h:103
list newDims
Definition: 05-ObsGroup.py:95
bool extractChannelSuffixIfPresent(const std::string &name, std::string &nameWithoutChannelSuffix, int &channel)
Definition: ObsSpace.cc:49
constexpr int Unlimited
Specifies that a dimension is resizable to infinity.
std::vector< std::pair< std::string, Variable > > VarNameObjectList
typedef for holding list of variable names with associated variable object
Definition: IodaUtils.h:30
std::string fullVarName(const std::string &groupName, const std::string &varName)
form full variable name given individual group and variable names
Definition: IodaUtils.cc:120
std::vector< std::shared_ptr< NewDimensionScale_Base > > NewDimensionScales_t
std::map< std::string, std::vector< std::string > > VarDimMap
typedef for holding dim names attached to variables
Definition: IodaUtils.h:36
void collectVarDimInfo(const ObsGroup &obsGroup, VarNameObjectList &varObjectList, VarNameObjectList &dimVarObjectList, VarDimMap &dimsAttachedToVars, Dimensions_t &maxVarSize0)
collect variable and dimension information from a ioda ObsGroup
Definition: IodaUtils.cc:125
std::vector< util::DateTime > convertRefOffsetToDtime(const int refIntDtime, const std::vector< float > &timeOffsets)
convert reference, time to DateTime object
Definition: IodaUtils.cc:251
std::shared_ptr< Distribution > createReplicaDistribution(const eckit::mpi::Comm &comm, std::shared_ptr< const Distribution > master, const std::vector< std::size_t > &masterRecordNums)
Create a suitable replica distribution for the distribution master.
std::vector< util::DateTime > convertDtStringsToDtime(const std::vector< std::string > &dtStrings)
convert datetime strings to DateTime object
Definition: IodaUtils.cc:239
ObsDimensionId
Definition: src/ObsSpace.h:61
std::vector< Dimensions_t > dimsCur
The dimensions of the data.
Definition: Dimensions.h:23
Dimensions_t dimensionality
The dimensionality (rank) of the data.
Definition: Dimensions.h:25
Used to specify backend creation-time properties.
Definition: Factory.h:59
A named pair of (variable_name, ioda::Variable).
Definition: Variable.h:752
Used to specify Variable creation-time properties.
Definition: Has_Variables.h:57
VariableCreationParameters & setFillValue(DataType fill)
Definition: Has_Variables.h:69
Container used to store and manipulate fill values.
Definition: Fill.h:35