IODA
ObsFrameRead.cc
Go to the documentation of this file.
1 /*
2  * (C) Copyright 2017-2019 UCAR
3  *
4  * This software is licensed under the terms of the Apache Licence Version 2.0
5  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
6  */
7 
8 #include "oops/util/abor1_cpp.h"
9 
10 #include "oops/util/Logger.h"
11 
12 #include "ioda/distribution/DistributionFactory.h"
13 #include "ioda/io/ObsFrameRead.h"
14 #include "ioda/io/ObsIoFactory.h"
15 
16 namespace ioda {
17 
18 //--------------------------- public functions ---------------------------------------
19 //------------------------------------------------------------------------------------
21  ObsFrame(params) {
22  // Create the ObsIo object
24  eckit::LocalConfiguration distConf = params.top_level_.toConfiguration();
25  distname_ = distConf.getString("distribution", "RoundRobin");
26 
27  // Create an MPI distribution
28  each_process_reads_separate_obs_ = obs_io_->eachProcessGeneratesSeparateObs();
30  if ("Halo" == distname_) {
31  dist_ = DistributionFactory::create(params.comm(), distConf);
32  } else {
33  // On each process the obs_io_ object will produce a separate series of observations,
34  // so we need to use a non-overlapping distribution. The RoundRobin will do.
35  eckit::LocalConfiguration rrConf;
36  rrConf.set("distribution", "RoundRobin");
37  dist_ = DistributionFactory::create(params.comm(), rrConf);
38  }
39  } else {
40  dist_ = DistributionFactory::create(params.comm(), distConf);
41  }
42 
43  max_frame_size_ = params.top_level_.obsIoInParameters().maxFrameSize;
44  oops::Log::debug() << "ObsFrameRead: maximum frame size: " << max_frame_size_ << std::endl;
45 }
46 
48 
49 //------------------------------------------------------------------------------------
51  // reset counters, etc.
52  frame_start_ = 0;
54  // Ensure record numbers assigned on different processes don't overlap
55  next_rec_num_ = params_.comm().rank();
56  rec_num_increment_ = params_.comm().size();
57  } else {
58  next_rec_num_ = 0;
60  }
61  unique_rec_nums_.clear();
62  max_var_size_ = obs_io_->maxVarSize();
63  nlocs_ = 0;
65  gnlocs_ = 0;
66 
67  // create an ObsGroup based frame with an in-memory backend
68  createFrameFromObsGroup(obs_io_->varList(), obs_io_->dimVarList(), obs_io_->varDimMap());
69 
70  // record the variable name <-> dim names associations.
72 }
73 
74 //------------------------------------------------------------------------------------
78 }
79 
80 //------------------------------------------------------------------------------------
82  bool haveAnotherFrame = (frame_start_ < max_var_size_);
83  // If there is another frame, then read it into obs_frame_
84  if (haveAnotherFrame) {
85  // Resize along the nlocs dimension
88  { std::pair<Variable, Dimensions_t>(nlocsVar, frameCount("nlocs")) });
89 
90  // Transfer all variable data
91  Dimensions_t frameStart = this->frameStart();
92  for (auto & varNameObject : obs_io_->varList()) {
93  std::string varName = varNameObject.first;
94  Variable sourceVar = varNameObject.second;
95  Dimensions_t frameCount = this->basicFrameCount(sourceVar);
96  if (frameCount > 0) {
97  // Transfer the variable data for this frame. Do this in two steps:
98  // ObsIo --> memory buffer --> frame storage
99 
100  // Selection objects for transfer;
101  std::vector<Dimensions_t> varShape = sourceVar.getDimensions().dimsCur;
102  Selection obsIoSelect = createObsIoSelection(varShape, frameStart, frameCount);
103  Selection memBufferSelect = createMemSelection(varShape, frameCount);
104  Selection obsFrameSelect = createEntireFrameSelection(varShape, frameCount);
105 
106  // Transfer the data
107  Variable destVar = obs_frame_.vars.open(varName);
108  if (destVar.isA<int>()) {
109  std::vector<int> varValues;
110  sourceVar.read<int>(varValues, memBufferSelect, obsIoSelect);
111  destVar.write<int>(varValues, memBufferSelect, obsFrameSelect);
112  } else if (destVar.isA<float>()) {
113  std::vector<float> varValues;
114  sourceVar.read<float>(varValues, memBufferSelect, obsIoSelect);
115  destVar.write<float>(varValues, memBufferSelect, obsFrameSelect);
116  } else if (destVar.isA<std::string>()) {
117  std::vector<std::string> varValues;
118  sourceVar.read<std::string>(varValues, memBufferSelect, obsIoSelect);
119  destVar.write<std::string>(varValues, memBufferSelect, obsFrameSelect);
120  }
121  }
122  }
123 
124  // generate the frame index and record numbers for this frame
126 
127  // clear the selection caches
128  known_frame_selections_.clear();
129  known_mem_selections_.clear();
130  } else {
131  if (obs_io_->eachProcessGeneratesSeparateObs()) {
132  // sum up global location counts on all PEs
133  params_.comm().allReduceInPlace(gnlocs_, eckit::mpi::sum());
134  params_.comm().allReduceInPlace(gnlocs_outside_timewindow_, eckit::mpi::sum());
135  }
136  // assign each record to the patch of a unique PE
137  dist_->computePatchLocs();
138  }
139  return (haveAnotherFrame);
140 }
141 
142 //------------------------------------------------------------------------------------
143 Dimensions_t ObsFrameRead::frameStart() {
144  return frame_start_;
145 }
146 
147 //------------------------------------------------------------------------------------
148 Dimensions_t ObsFrameRead::frameCount(const std::string & varName) {
149  Variable var = obs_io_->vars().open(varName);
150  Dimensions_t fCount;
151  if (var.isDimensionScale()) {
152  fCount = basicFrameCount(var);
153  } else {
154  if (obs_io_->isVarDimByNlocs(varName)) {
156  } else {
157  fCount = basicFrameCount(var);
158  }
159  }
160  return fCount;
161 }
162 
163 //-----------------------------------------------------------------------------------
164 bool ObsFrameRead::readFrameVar(const std::string & varName, std::vector<int> & varData) {
165  return readFrameVarHelper<int>(varName, varData);
166 }
167 bool ObsFrameRead::readFrameVar(const std::string & varName, std::vector<float> & varData) {
168  return readFrameVarHelper<float>(varName, varData);
169 }
170 bool ObsFrameRead::readFrameVar(const std::string & varName,
171  std::vector<std::string> & varData) {
172  return readFrameVarHelper<std::string>(varName, varData);
173 }
174 
175 //--------------------------- private functions --------------------------------------
176 //-----------------------------------------------------------------------------------
177 void ObsFrameRead::print(std::ostream & os) const {
178  os << "ObsFrameRead: " << std::endl;
179 }
180 
181 //------------------------------------------------------------------------------------
182 Dimensions_t ObsFrameRead::basicFrameCount(const Variable & var) {
183  Dimensions_t count;
184  Dimensions_t varSize0 = var.getDimensions().dimsCur[0];
185  if ((frame_start_ + max_frame_size_) > varSize0) {
186  count = varSize0 - frame_start_;
187  if (count < 0) { count = 0; }
188  } else {
189  count = max_frame_size_;
190  }
191  return count;
192 }
193 
194 //------------------------------------------------------------------------------------
195 Selection ObsFrameRead::createIndexedFrameSelection(const std::vector<Dimensions_t> & varShape) {
196  // frame_loc_index_ contains the indices for the first dimension. Subsequent
197  // dimensions, we want to select all indices.
198  Selection indexedFrameSelect;
199  indexedFrameSelect.extent(varShape)
201  for (std::size_t i = 1; i < varShape.size(); ++i) {
202  std::vector<Dimensions_t> dimIndex(varShape[i]);
203  std::iota(dimIndex.begin(), dimIndex.end(), 0);
204  indexedFrameSelect.extent(varShape).select({ SelectionOperator::AND, i, dimIndex });
205  }
206  return indexedFrameSelect;
207 }
208 
209 // -----------------------------------------------------------------------------
210 void ObsFrameRead::genFrameIndexRecNums(std::shared_ptr<Distribution> & dist) {
211  // Generate location indices relative to the obs source (locIndex) and relative
212  // to the current frame (frameIndex).
213  std::vector<Dimensions_t> locIndex;
214  std::vector<Dimensions_t> frameIndex;
215 
216  // Apply the timing window. Need to filter out locations that are outside the
217  // timing window before generating record numbers. This is because
218  // we are generating record numbers on the fly since we want to get to the point where
219  // we can do the MPI distribution without knowing how many obs (and records) we are going
220  // to encounter. Only apply the timing window in the case of reading from a file.
221  if (obs_io_->applyTimingWindow()) {
222  genFrameLocationsTimeWindow(locIndex, frameIndex);
223  } else {
224  genFrameLocationsAll(locIndex, frameIndex);
225  }
226 
227  // Generate record numbers for this frame. Consider obs grouping.
228  std::vector<Dimensions_t> records;
229  const std::vector<std::string> &obsGroupVarList = obs_io_->obsGroupingVars();
230  if (obsGroupVarList.empty()) {
231  genRecordNumbersAll(locIndex, records);
232  } else {
233  genRecordNumbersGrouping(obsGroupVarList, frameIndex, records);
234  }
235 
236  // Apply the MPI distribution to the records
237  applyMpiDistribution(dist, locIndex, records);
238 
239  // New frame count is the number of entries in the frame_loc_index_ vector
240  // This will be handed to callers through the frameCount function for all
241  // variables with nlocs as their first dimension.
243 }
244 
245 //------------------------------------------------------------------------------------
246 void ObsFrameRead::genFrameLocationsAll(std::vector<Dimensions_t> & locIndex,
247  std::vector<Dimensions_t> & frameIndex) {
248  Dimensions_t locSize = this->frameCount("nlocs");
249  gnlocs_ += locSize;
250 
251  locIndex.resize(locSize);
252  std::iota(locIndex.begin(), locIndex.end(), this->frameStart());
253 
254  frameIndex.resize(locSize);
255  std::iota(frameIndex.begin(), frameIndex.end(), 0);
256 }
257 
258 //------------------------------------------------------------------------------------
259 void ObsFrameRead::genFrameLocationsTimeWindow(std::vector<Dimensions_t> & locIndex,
260  std::vector<Dimensions_t> & frameIndex) {
261  Dimensions_t frameCount = this->frameCount("nlocs");
262  Dimensions_t frameStart = this->frameStart();
263 
264  // Prefer MetaData/datetime. Eventually "MetaData/time" will be obsoleted.
265  std::string dtVarName;
266  if (obs_frame_.vars.exists("MetaData/datetime")) {
267  dtVarName = std::string("MetaData/datetime");
268  } else if (obs_frame_.vars.exists("MetaData/time")) {
269  dtVarName = std::string("MetaData/time");
270  } else {
271  std::string ErrMsg =
272  std::string("ERROR: ObsFrameRead::genFrameLocationsTimeWindow: ") +
273  std::string("date time information does not exist, ") +
274  std::string("cannot perform time window filtering");
275  throw eckit::UserError(ErrMsg, Here());
276  }
277 
278  // Build the selection objects
279  Variable dtVar = obs_frame_.vars.open(dtVarName);
280  std::vector<Dimensions_t> varShape = dtVar.getDimensions().dimsCur;
281  Selection memSelect = createMemSelection(varShape, frameCount);
282  Selection frameSelect = createEntireFrameSelection(varShape, frameCount);
283 
284  // convert ref, offset time to datetime objects
285  std::vector<util::DateTime> dtimeVals;
286  if (dtVarName == "MetaData/datetime") {
287  std::vector<std::string> dtValues;
288  dtVar.read<std::string>(dtValues, memSelect, frameSelect);
289  dtValues.resize(frameCount);
290 
291  dtimeVals = convertDtStringsToDtime(dtValues);
292  } else {
293  std::vector<float> dtValues;
294  dtVar.read<float>(dtValues, memSelect, frameSelect);
295  dtValues.resize(frameCount);
296 
297  int refDtime;
298  this->obs_io_->atts().open("date_time").read<int>(refDtime);
299  dtimeVals = convertRefOffsetToDtime(refDtime, dtValues);
300  }
301 
302  // Keep all locations that fall inside the timing window. Note iloc will be set
303  // to the number of locations stored in the output vectors after exiting the
304  // following for loop.
305  locIndex.resize(frameCount);
306  frameIndex.resize(frameCount);
307  std::size_t iloc = 0;
308  for (std::size_t i = 0; i < frameCount; ++i) {
309  if (this->insideTimingWindow(dtimeVals[i])) {
310  locIndex[iloc] = frameStart + i;
311  frameIndex[iloc] = i;
312  iloc++;
313  } else {
315  }
316  }
317  locIndex.resize(iloc);
318  frameIndex.resize(iloc);
319  gnlocs_ += iloc;
320 }
321 
322 //------------------------------------------------------------------------------------
323 void ObsFrameRead::genRecordNumbersAll(const std::vector<Dimensions_t> & locIndex,
324  std::vector<Dimensions_t> & records) {
325  // No obs grouping. Assign each location to a separate record.
326  Dimensions_t locSize = locIndex.size();
327  records.assign(locSize, 0);
328  for (std::size_t i = 0; i < locSize; ++i) {
329  records[i] = next_rec_num_;
331  }
332 }
333 
334 //------------------------------------------------------------------------------------
335 void ObsFrameRead::genRecordNumbersGrouping(const std::vector<std::string> & obsGroupVarList,
336  const std::vector<Dimensions_t> & frameIndex,
337  std::vector<Dimensions_t> & records) {
338  // Form the selection objects for reading the variables
339 
340  // Applying obs grouping. First convert all of the group variable data values for this
341  // frame into string key values. This is done in one call to minimize accessing the
342  // frame data for the grouping variables.
343  std::size_t locSize = frameIndex.size();
344  records.assign(locSize, 0);
345  std::vector<std::string> obsGroupingKeys(locSize);
346  buildObsGroupingKeys(obsGroupVarList, frameIndex, obsGroupingKeys);
347 
348  for (std::size_t i = 0; i < locSize; ++i) {
349  if (obs_grouping_.find(obsGroupingKeys[i]) == obs_grouping_.end()) {
350  // key is not present in the map
351  // assign current record number to the current key, and move to the next record number
352  obs_grouping_.insert(
353  std::pair<std::string, std::size_t>(obsGroupingKeys[i], next_rec_num_));
355  }
356  records[i] = obs_grouping_.at(obsGroupingKeys[i]);
357  }
358 }
359 
360 //------------------------------------------------------------------------------------
361 void ObsFrameRead::buildObsGroupingKeys(const std::vector<std::string> & obsGroupVarList,
362  const std::vector<Dimensions_t> & frameIndex,
363  std::vector<std::string> & groupingKeys) {
364  // Walk though each variable and construct the segments of the key values (strings)
365  // Append the segments as each variable is encountered.
366  for (std::size_t i = 0; i < obsGroupVarList.size(); ++i) {
367  // Retrieve the variable values from the obs frame and convert
368  // those values to strings. Then append those "value" strings from each
369  // variable to form the grouping keys.
370  std::string obsGroupVarName = obsGroupVarList[i];
371  std::string varName = std::string("MetaData/") + obsGroupVarName;
372  Variable groupVar = obs_frame_.vars.open(varName);
373  if (!obs_io_->isVarDimByNlocs(varName)) {
374  std::string ErrMsg =
375  std::string("ERROR: ObsFrameRead::genRecordNumbersGrouping: ") +
376  std::string("obs grouping variable (") + obsGroupVarName +
377  std::string(") must have 'nlocs' as first dimension");
378  ABORT(ErrMsg);
379  }
380 
381  // Form selection objects to grab the current frame values
382  Dimensions_t frameStart = this->frameStart();
383  Dimensions_t frameCount = this->frameCount("nlocs");
384 
385  std::vector<Dimensions_t> varShape = groupVar.getDimensions().dimsCur;
386  Selection memSelect = createMemSelection(varShape, frameCount);
387  Selection frameSelect = createEntireFrameSelection(varShape, frameCount);
388 
389  std::string keySegment;
390  if (groupVar.isA<int>()) {
391  std::vector<int> groupVarValues;
392  groupVar.read<int>(groupVarValues, memSelect, frameSelect);
393  groupVarValues.resize(frameCount);
394  for (std::size_t j = 0; j < frameIndex.size(); ++j) {
395  keySegment = std::to_string(groupVarValues[frameIndex[j]]);
396  if (i == 0) {
397  groupingKeys[j] = keySegment;
398  } else {
399  groupingKeys[j] += ":";
400  groupingKeys[j] += keySegment;
401  }
402  }
403  } else if (groupVar.isA<float>()) {
404  std::vector<float> groupVarValues;
405  groupVar.read<float>(groupVarValues, memSelect, frameSelect);
406  groupVarValues.resize(frameCount);
407  for (std::size_t j = 0; j < frameIndex.size(); ++j) {
408  keySegment = std::to_string(groupVarValues[frameIndex[j]]);
409  if (i == 0) {
410  groupingKeys[j] = keySegment;
411  } else {
412  groupingKeys[j] += ":";
413  groupingKeys[j] += keySegment;
414  }
415  }
416  } else if (groupVar.isA<std::string>()) {
417  std::vector<std::string> groupVarValues;
418  groupVar.read<std::string>(groupVarValues, memSelect, frameSelect);
419  groupVarValues.resize(frameCount);
420  for (std::size_t j = 0; j < frameIndex.size(); ++j) {
421  keySegment = groupVarValues[frameIndex[j]];
422  if (i == 0) {
423  groupingKeys[j] = keySegment;
424  } else {
425  groupingKeys[j] += ":";
426  groupingKeys[j] += keySegment;
427  }
428  }
429  }
430  }
431 }
432 
433 //------------------------------------------------------------------------------------
434 void ObsFrameRead::applyMpiDistribution(const std::shared_ptr<Distribution> & dist,
435  const std::vector<Dimensions_t> & locIndex,
436  const std::vector<Dimensions_t> & records) {
437  // Read lat/lon for this frame
438  Dimensions_t locSize = locIndex.size();
439  std::vector<float> lats(locSize, 0);
440  std::vector<float> lons(locSize, 0);
441  Dimensions_t frameStart = this->frameStart();
442  // Form selection objects to grab the current frame values
443  Dimensions_t frameCount = this->frameCount("nlocs");
444 
445  // Assume that lat and lon variables are shaped the same
446  if (!obs_frame_.vars.exists("MetaData/longitude")) {
447  throw eckit::UserError("MetaData/longitude not found in observations file", Here());
448  }
449  Variable latLonVar = obs_frame_.vars.open("MetaData/longitude");
450  std::vector<Dimensions_t> varShape = latLonVar.getDimensions().dimsCur;
451  Selection memSelect = createMemSelection(varShape, frameCount);
452  Selection frameSelect = createEntireFrameSelection(varShape, frameCount);
453 
454  latLonVar.read(lons, memSelect, frameSelect);
455  lons.resize(frameCount);
456 
457  if (!obs_frame_.vars.exists("MetaData/latitude")) {
458  throw eckit::UserError("MetaData/latitude not found in observations file", Here());
459  }
460  latLonVar = obs_frame_.vars.open("MetaData/latitude");
461  latLonVar.read(lats, memSelect, frameSelect);
462  lats.resize(frameCount);
463 
464  /// If "save obs distribution" is set to true in a previous run,
465  /// global location indices and record numbers have stored
466  /// in the MetaData/saved_index and MetaData/saved_record_number variables,
467  /// along with all other variables in separate files.
468  ///
469  /// When the "obsdatain.read obs from separate file" option is set,
470  /// each process reads a separate input file generated previously,
471  /// to use the stored index and record_number.
472 
473  std::vector<int> saved_index(locSize, 0);
474  std::vector<int> saved_record_number(locSize, 0);
475 
476  if (each_process_reads_separate_obs_ && ("Halo" == distname_)) {
477  // Assume that saved_index and saved_record_number variables are shaped the same
478  if (!obs_frame_.vars.exists("MetaData/saved_record_number")) {
479  throw eckit::UserError("MetaData/saved_record_number not found in observations file",
480  Here());
481  }
482  Variable locVar = obs_frame_.vars.open("MetaData/saved_record_number");
483  varShape = locVar.getDimensions().dimsCur;
484  Selection locMemSelect = createMemSelection(varShape, frameCount);
485  Selection locFrameSelect = createEntireFrameSelection(varShape, frameCount);
486  locVar.read(saved_record_number, locMemSelect, locFrameSelect);
487  saved_record_number.resize(frameCount);
488 
489  if (!obs_frame_.vars.exists("MetaData/saved_index")) {
490  throw eckit::UserError("MetaData/saved_index not found in observations file", Here());
491  }
492  locVar = obs_frame_.vars.open("MetaData/saved_index");
493  locVar.read(saved_index, locMemSelect, locFrameSelect);
494  saved_index.resize(frameCount);
495  }
496 
497  // Generate the index and recnums for this frame.
498  const std::size_t commSize = params_.comm().size();
499  const std::size_t commRank = params_.comm().rank();
500  std::size_t rowNum = 0;
501  std::size_t recNum = 0;
502  std::size_t frameIndex = 0;
503  std::size_t globalLocIndex = 0;
504  frame_loc_index_.clear();
505  for (std::size_t i = 0; i < locSize; ++i) {
506  if (each_process_reads_separate_obs_ && ("Halo" == distname_)) {
507  rowNum = saved_index[i];
508  recNum = saved_record_number[i];
509  frameIndex = i;
510  } else {
511  rowNum = locIndex[i];
512  recNum = records[i];
513  // The current frame storage always starts at zero so frameIndex
514  // needs to be the offset from the ObsIo frame start.
515  frameIndex = rowNum - frameStart;
516  }
517 
518  eckit::geometry::Point2 point(lons[frameIndex], lats[frameIndex]);
519 
520  std::size_t globalLocIndex = rowNum;
521  if (each_process_reads_separate_obs_ && ("Halo" != distname_)) {
522  // Each process reads a different set of observations. Make sure all of them are assigned
523  // different global location indices
524  globalLocIndex = rowNum * commSize + commRank;
525  }
526  dist_->assignRecord(recNum, globalLocIndex, point);
527 
528  if (dist->isMyRecord(recNum)) {
529  indx_.push_back(globalLocIndex);
530  recnums_.push_back(recNum);
531  unique_rec_nums_.insert(recNum);
532  frame_loc_index_.push_back(frameIndex);
533  nlocs_++;
534  }
535  }
536  nrecs_ = unique_rec_nums_.size();
537 }
538 
539 // -----------------------------------------------------------------------------
540 bool ObsFrameRead::insideTimingWindow(const util::DateTime & obsDt) {
541  return ((obsDt > params_.windowStart()) && (obsDt <= params_.windowEnd()));
542 }
543 
544 } // namespace ioda
static std::unique_ptr< Distribution > create(const eckit::mpi::Comm &comm, const eckit::Configuration &config)
Create a Distribution object implementing a particular method of distributing observations across mul...
Dimensions_t nlocs_
number of locations from source (file or generator)
Definition: ObsFrame.h:170
std::shared_ptr< ObsIo > obs_io_
ObsIo object.
Definition: ObsFrame.h:161
Selection createMemSelection(const std::vector< Dimensions_t > &varShape, const Dimensions_t frameCount)
create selection object for accessing a memory buffer
Definition: ObsFrame.cc:26
void createFrameFromObsGroup(const VarNameObjectList &varList, const VarNameObjectList &dimVarList, const VarDimMap &varDimMap)
create a frame object based on dimensions and variables from a source ObsGroup
Definition: ObsFrame.cc:109
Dimensions_t max_frame_size_
maximum frame size
Definition: ObsFrame.h:183
Dimensions_t max_var_size_
maximum variable size
Definition: ObsFrame.h:186
VarDimMap ioVarDimMap() const
return map from variables to their attached dimension scales
Definition: ObsFrame.h:70
Selection createEntireFrameSelection(const std::vector< Dimensions_t > &varShape, const Dimensions_t frameCount)
create selection object for accessing the entire frame variable
Definition: ObsFrame.cc:49
Dimensions_t frame_start_
current frame starting index
Definition: ObsFrame.h:189
Selection createObsIoSelection(const std::vector< Dimensions_t > &varShape, const Dimensions_t frameStart, const Dimensions_t frameCount)
create selection object for accessing an ObsIo variable
Definition: ObsFrame.cc:91
Dimensions_t gnlocs_outside_timewindow_
number of nlocs from the file (gnlocs) that are outside the time window
Definition: ObsFrame.h:177
Dimensions_t gnlocs_
total number of locations from source (file or generator) that were selected after the timing window ...
Definition: ObsFrame.h:174
Dimensions_t nrecs_
number of records from source (file or generator)
Definition: ObsFrame.h:167
ObsSpaceParameters params_
ObsIo parameter specs.
Definition: ObsFrame.h:180
ObsGroup obs_frame_
ObsGroup object (temporary storage for a single frame)
Definition: ObsFrame.h:164
std::map< std::string, std::size_t > obs_grouping_
map for obs grouping via string keys
Dimensions_t adjusted_nlocs_frame_start_
current frame start for variable dimensioned along nlocs
Selection createIndexedFrameSelection(const std::vector< Dimensions_t > &varShape)
set up frontend and backend selection objects for the given variable
void frameNext() override
move to the next frame
Definition: ObsFrameRead.cc:75
void applyMpiDistribution(const std::shared_ptr< Distribution > &dist, const std::vector< Dimensions_t > &locIndex, const std::vector< Dimensions_t > &records)
apply MPI distribution
Dimensions_t adjusted_nlocs_frame_count_
current frame count for variable dimensioned along nlocs
Dimensions_t frameCount(const std::string &varName) override
return current frame count for variable
std::size_t rec_num_increment_
spacing between record numbers assigned on this process.
VarDimMap dims_attached_to_vars_
map showing association of dim names with each variable name
std::size_t next_rec_num_
next available record number
std::string distname_
\Brief Distribution Name
bool frameAvailable() override
true if a frame is available (not past end of frames)
Definition: ObsFrameRead.cc:81
void frameInit() override
initialize for walking through the frames
Definition: ObsFrameRead.cc:50
bool each_process_reads_separate_obs_
true if obs_io_ produces a different series of observations on each process, false if they are all th...
Dimensions_t basicFrameCount(const Variable &var)
return current frame count for variable
std::set< std::size_t > unique_rec_nums_
unique record numbers
bool readFrameVar(const std::string &varName, std::vector< int > &varData)
read a frame variable
void print(std::ostream &os) const override
print routine for oops::Printable base class
std::shared_ptr< Distribution > dist_
MPI distribution object.
void buildObsGroupingKeys(const std::vector< std::string > &obsGroupVarList, const std::vector< Dimensions_t > &frameIndex, std::vector< std::string > &groupingKeys)
generate string keys for record number assignment
void genRecordNumbersGrouping(const std::vector< std::string > &obsGroupVarList, const std::vector< Dimensions_t > &frameIndex, std::vector< Dimensions_t > &records)
generate record numbers considering obs grouping
std::map< std::vector< std::string >, Selection > known_frame_selections_
cache for frame selection
void genRecordNumbersAll(const std::vector< Dimensions_t > &locIndex, std::vector< Dimensions_t > &records)
generate record numbers where each location is a unique record (no grouping)
std::map< std::vector< std::string >, Selection > known_mem_selections_
cache for memory buffer selection
ObsFrameRead(const ObsSpaceParameters &params)
Definition: ObsFrameRead.cc:20
Dimensions_t frameStart() override
return current frame starting index
void genFrameLocationsAll(std::vector< Dimensions_t > &locIndex, std::vector< Dimensions_t > &frameIndex)
generate indices for all locations in current frame
bool insideTimingWindow(const util::DateTime &ObsDt)
std::vector< std::size_t > recnums_
record numbers associated with the location indexes
std::vector< std::size_t > indx_
indexes of locations to extract from the input obs file
void genFrameLocationsTimeWindow(std::vector< Dimensions_t > &locIndex, std::vector< Dimensions_t > &frameIndex)
generate indices for locations in current frame after filtering out obs outside DA timing window
std::vector< Dimensions_t > frame_loc_index_
location indices for current frame
void genFrameIndexRecNums(std::shared_ptr< Distribution > &dist)
generate frame indices and corresponding record numbers
void resize(const std::vector< std::pair< Variable, ioda::Dimensions_t >> &newDims)
Resize a Dimension and every Variable that depends on it.
Definition: ObsGroup.cpp:85
static std::shared_ptr< ObsIo > create(ObsIoModes mode, const ObsSpaceParameters &parameters)
Create and return a new instance of an ObsIo subclass.
Definition: ObsIoFactory.cc:24
const util::DateTime & windowEnd() const
return the end of the DA timing window
const util::DateTime & windowStart() const
return the start of the DA timing window
const eckit::mpi::Comm & comm() const
return the associated MPI group communicator
A Selection represents the bounds of the data, in ioda or in userspace, that you are reading or writi...
Definition: Selection.h:48
Variables store data!
Definition: Variable.h:680
Has_Variables vars
Use this to access variables.
Definition: Group.h:123
virtual Variable open(const std::string &name) const
Open a Variable by name.
virtual bool exists(const std::string &name) const
Does a Variable with the specified name exist?
bool isA() const
Convenience function to check a Variable's storage type.
Definition: Variable.h:99
virtual bool isDimensionScale() const
Is this Variable used as a dimension scale?
Definition: Variable.cpp:251
virtual Dimensions getDimensions() const
Definition: Variable.cpp:160
virtual Variable read(gsl::span< char > data, const Type &in_memory_dataType, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Read the Variable - as char array. Ordering is row-major.
Definition: Variable.cpp:330
virtual Variable write(gsl::span< char > data, const Type &in_memory_dataType, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all)
The fundamental write function. Backends overload this function to implement all write operations.
Definition: Variable.cpp:317
virtual Variable resize(const std::vector< Dimensions_t > &newDims)
Resize the variable.
Definition: Variable.cpp:172
Selection & extent(const VecDimensions_t &sz)
Provide the dimensions of the object that you are selecting from.
Definition: Selection.h:111
Selection & select(const SingleSelection &s)
Append a new selection.
Definition: Selection.h:103
std::vector< util::DateTime > convertRefOffsetToDtime(const int refIntDtime, const std::vector< float > &timeOffsets)
convert reference, time to DateTime object
Definition: IodaUtils.cc:251
std::vector< util::DateTime > convertDtStringsToDtime(const std::vector< std::string > &dtStrings)
convert datetime strings to DateTime object
Definition: IodaUtils.cc:239
std::vector< Dimensions_t > dimsCur
The dimensions of the data.
Definition: Dimensions.h:23