IODA
ObsIoGenerateRandom.cc
Go to the documentation of this file.
1 /*
2  * (C) Copyright 2017-2019 UCAR
3  *
4  * This software is licensed under the terms of the Apache Licence Version 2.0
5  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
6  */
7 
8 #include "ioda/io/ObsIoGenerateRandom.h"
9 
10 #include "ioda/Engines/Factory.h"
11 #include "ioda/io/ObsIoGenerateUtils.h"
12 #include "ioda/Misc/Dimensions.h"
13 
14 #include "oops/util/missingValues.h"
15 #include "oops/util/Random.h"
16 
17 namespace ioda {
18 
19 static ObsIoMaker<ObsIoGenerateRandom> maker("GenerateRandom");
20 
21 //----------------------------- public functions ------------------------------------
22 //-----------------------------------------------------------------------------------
24  const ObsSpaceParameters & obsSpaceParams) :
25  ObsIo() {
26  // Create an in-memory backend and attach it to an in-memory ObsGroup
27  Engines::BackendNames backendName;
29 
30  backendName = Engines::BackendNames::ObsStore;
31  Group backend = constructBackend(backendName, backendParams);
32 
34  const boost::optional<oops::Variables> & obsSimVarsVal =
35  obsSpaceParams.top_level_.simVars.value();
36 
37  oops::Log::trace() << "Constructing ObsIoGenerateRandom: Random method" << std::endl;
38 
39  // Create the in-memory ObsGroup
40  Dimensions_t numLocs = ioParams.random.numObs;
41  newDims.push_back(
42  ioda::NewDimensionScale<int>("nlocs", numLocs, numLocs, numLocs));
44 
45  // Fill in the ObsGroup with the generated data
46  genDistRandom(ioParams.random,
47  obsSpaceParams.windowStart(), obsSpaceParams.windowEnd(), obsSpaceParams.comm(),
48  ioParams.obsErrors, obsSimVarsVal->variables());
49 
50  // record counts useful for an obs source
52 
53  // Collect variable and dimension infomation for downstream use
56 
57  // record variables by which observations should be grouped into records
58  obs_grouping_vars_ = ioParams.obsGrouping.value().obsGroupVars;
59 }
60 
62 
63 //----------------------------- public functions -------------------------------
64 
65 //----------------------------- private functions -----------------------------------
66 //-----------------------------------------------------------------------------------
68  const util::DateTime & winStart,
69  const util::DateTime & winEnd,
70  const eckit::mpi::Comm & comm,
71  const std::vector<float> & obsErrors,
72  const std::vector<std::string> & simVarNames) {
73  ASSERT(obsErrors.size() == simVarNames.size());
74 
75  /// Grab the parameter values
76  int numLocs = params.numObs;
77  float latStart = params.latStart;
78  float latEnd = params.latEnd;
79  float lonStart = params.lonStart;
80  float lonEnd = params.lonEnd;
81  int ranSeed;
82  if (params.ranSeed.value() != boost::none) {
83  ranSeed = params.ranSeed.value().get();
84  } else {
85  ranSeed = std::time(0); // based on the current date/time.
86  }
87 
88  // Use the following formula to generate random lat, lon and time values.
89  //
90  // val = val1 + (random_number_between_0_and_1 * (val2-val1))
91  //
92  // where val2 > val1.
93  //
94  // Create a list of random values between 0 and 1 to be used for generating
95  // random lat, lon and time vaules.
96  //
97  // Use different seeds for lat and lon so that in the case where lat and lon ranges
98  // are the same, you get a different sequences for lat compared to lon.
99  //
100  // Have rank 0 generate the full length random sequences, and then
101  // broadcast these to the other ranks. This ensures that every rank
102  // contains the same random sequences. If all ranks generated their
103  // own sequences, which they could do, the sequences between ranks
104  // would be different in the case where random_seed is not specified.
105  std::vector<float> ranVals(numLocs, 0.0);
106  std::vector<float> ranVals2(numLocs, 0.0);
107  if (comm.rank() == 0) {
108  util::UniformDistribution<float> ranUD(numLocs, 0.0, 1.0, ranSeed);
109  util::UniformDistribution<float> ranUD2(numLocs, 0.0, 1.0, ranSeed+1);
110 
111  ranVals = ranUD.data();
112  ranVals2 = ranUD2.data();
113  }
114  comm.broadcast(ranVals, 0);
115  comm.broadcast(ranVals2, 0);
116 
117  // Form the ranges val2-val for lat, lon, time
118  float latRange = latEnd - latStart;
119  float lonRange = lonEnd - lonStart;
120  util::Duration windowDuration(winEnd - winStart);
121  float timeRange = static_cast<float>(windowDuration.toSeconds());
122 
123  // Create vectors for lat, lon, time, fill them with random values
124  // inside their respective ranges, and put results into the obs container.
125  std::vector<float> latVals(numLocs, 0.0);
126  std::vector<float> lonVals(numLocs, 0.0);
127  std::vector<std::string> dtStrings(numLocs, "");
128 
129  util::Duration durZero(0);
130  util::Duration durOneSec(1);
131  for (std::size_t ii = 0; ii < numLocs; ii++) {
132  latVals[ii] = latStart + (ranVals[ii] * latRange);
133  lonVals[ii] = lonStart + (ranVals2[ii] * lonRange);
134 
135  // Currently the filter for time stamps on obs values is:
136  //
137  // windowStart < ObsTime <= windowEnd
138  //
139  // If we get a zero offsetDt, then change it to 1 second so that the observation
140  // will remain inside the timing window.
141  util::Duration offsetDt(static_cast<int64_t>(ranVals[ii] * timeRange));
142  if (offsetDt == durZero) {
143  offsetDt = durOneSec;
144  }
145  // convert result to ISO 8601 string
146  util::DateTime dtVal = winStart + offsetDt;
147  dtStrings[ii] = dtVal.toString();
148  }
149 
150  // Transfer the generated values to the ObsGroup
151  storeGenData(latVals, lonVals, dtStrings, simVarNames, obsErrors, obs_group_);
152 }
153 
154 //-----------------------------------------------------------------------------------
155 void ObsIoGenerateRandom::print(std::ostream & os) const {
156  os << "ObsIoGenerateRandom: " << std::endl;
157 }
158 
159 } // namespace ioda
Describe the dimensions of a ioda::Attribute or ioda::Variable.
Definitions for setting up backends with file and memory I/O.
oops::RequiredParameter< int > numObs
number of observations
Groups are a new implementation of ObsSpaces.
Definition: Group.h:159
oops::Parameter< std::vector< float > > obsErrors
obs error estimates
Options controlling the ObsIoGenerateRandom class.
EmbeddedObsGenerateRandomParameters random
options shared by this class and the legacy implementation (LegacyObsGenerateParameters)
static ObsGroup generate(Group &emptyGroup, const NewDimensionScales_t &fundamentalDims, std::shared_ptr< const detail::DataLayoutPolicy > layout=nullptr)
Create an empty ObsGroup and populate it with the fundamental dimensions.
Definition: ObsGroup.cpp:72
ObsIoGenerateRandom(const Parameters_ &ioParams, const ObsSpaceParameters &obsSpaceParams)
void genDistRandom(const EmbeddedObsGenerateRandomParameters &params, const util::DateTime &winStart, const util::DateTime &winEnd, const eckit::mpi::Comm &comm, const std::vector< float > &obsErrors, const std::vector< std::string > &simVarNames)
generate observation locations using the random method
void print(std::ostream &os) const override
print routine for oops::Printable base class
Dimensions_t max_var_size_
maximum variable size (ie, first dimension size)
Definition: ObsIo.h:97
Dimensions_t nlocs_
number of locations from source (file or generator)
Definition: ObsIo.h:100
VarNameObjectList var_list_
list of regular variables from source (file or generator)
Definition: ObsIo.h:103
std::vector< std::string > obs_grouping_vars_
names of variables to be used to group observations into records
Definition: ObsIo.h:112
VarNameObjectList dim_var_list_
list of dimension scale variables from source (file or generator)
Definition: ObsIo.h:106
Dimensions_t numLocs() const
return number of locations from the source
Definition: ObsIo.h:45
VarDimMap dims_attached_to_vars_
map containing variables with their attached dimension scales
Definition: ObsIo.h:109
ObsGroup obs_group_
ObsGroup object representing io source/destination.
Definition: ObsIo.h:94
oops::Parameter< ObsGroupingParameters > obsGrouping
options controlling obs record grouping
const util::DateTime & windowEnd() const
return the end of the DA timing window
ObsTopLevelParameters top_level_
sub groups of parameters
const util::DateTime & windowStart() const
return the start of the DA timing window
const eckit::mpi::Comm & comm() const
return the associated MPI group communicator
oops::RequiredParameter< oops::Variables > simVars
simulated variables
Has_Variables vars
Use this to access variables.
Definition: Group.h:123
virtual Variable open(const std::string &name) const
Open a Variable by name.
virtual Dimensions getDimensions() const
Definition: Variable.cpp:160
BackendNames
Backend names.
Definition: Factory.h:28
IODA_DL Group constructBackend(BackendNames name, BackendCreationParameters &params)
This is a simple factory style function that will instantiate a different backend based on a given na...
Definition: Factory.cpp:124
@ ObsStore
ObsStore in-memory.
list newDims
Definition: 05-ObsGroup.py:95
static DistributionMaker< AtlasDistribution > maker(DIST_NAME)
std::vector< std::shared_ptr< NewDimensionScale_Base > > NewDimensionScales_t
void storeGenData(const std::vector< float > &latVals, const std::vector< float > &lonVals, const std::vector< std::string > &dtStrings, const std::vector< std::string > &obsVarNames, const std::vector< float > &obsErrors, ObsGroup &obsGroup)
store generated data into an ObsGroup
void collectVarDimInfo(const ObsGroup &obsGroup, VarNameObjectList &varObjectList, VarNameObjectList &dimVarObjectList, VarDimMap &dimsAttachedToVars, Dimensions_t &maxVarSize0)
collect variable and dimension information from a ioda ObsGroup
Definition: IodaUtils.cc:125
std::vector< Dimensions_t > dimsCur
The dimensions of the data.
Definition: Dimensions.h:23
Used to specify backend creation-time properties.
Definition: Factory.h:59