IODA
ObsSpaceParameters.h
Go to the documentation of this file.
1 /*
2  * (C) Copyright 2020 UCAR
3  *
4  * This software is licensed under the terms of the Apache Licence Version 2.0
5  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
6  */
7 
8 #ifndef OBSSPACEPARAMETERS_H_
9 #define OBSSPACEPARAMETERS_H_
10 
11 #include <string>
12 #include <vector>
13 
14 #include "ioda/core/FileFormat.h"
15 #include "ioda/core/ParameterTraitsFileFormat.h"
17 #include "ioda/Misc/Dimensions.h"
18 #include "ioda/io/ObsIoFactory.h"
19 #include "ioda/io/ObsIoParametersBase.h"
20 
21 #include "eckit/exception/Exceptions.h"
22 #include "eckit/mpi/Comm.h"
23 
24 #include "oops/base/ObsSpaceBase.h" // for ObsSpaceParametersBase
25 #include "oops/base/ParameterTraitsVariables.h"
26 #include "oops/util/DateTime.h"
27 #include "oops/util/Logger.h"
28 #include "oops/util/parameters/OptionalParameter.h"
29 #include "oops/util/parameters/Parameter.h"
30 #include "oops/util/parameters/Parameters.h"
31 #include "oops/util/parameters/RequiredParameter.h"
32 #include "oops/util/parameters/RequiredPolymorphicParameter.h"
33 
34 
35 namespace eckit {
36  class Configuration;
37 }
38 
39 namespace ioda {
40 
42  OOPS_CONCRETE_PARAMETERS(ObsFileInParameters, ObsIoParametersBase)
43 
44  public:
45  /// input obs file name
46  oops::RequiredParameter<std::string> fileName{"obsfile", this};
47 
48  /// input obs file format
49  ///
50  /// Possible values:
51  /// * `hdf5`: HDF5 file format
52  /// * `odb`: ODB file format
53  /// * `auto` (default): file format determined automatically from the file name extension
54  /// (`.odb` -- ODB, everything else -- HDF5).
55  oops::Parameter<FileFormat> format{"format", FileFormat::AUTO, this};
56 
57  /// reading from multiple files (1 per MPI task)
58  /// This option is not typically used. It is used to tell the system
59  /// to read observations from the ioda output files (one per MPI task)
60  /// from a prior run instead of reading and distributing from the original
61  /// file. This is currently being used in LETKF applictions.
62  oops::Parameter<bool> readFromSeparateFiles{"read obs from separate file", false, this};
63 
64  /// file with variable name mapping rules
65  ///
66  /// Required for obs files in the ODB format, unused otherwise.
67  oops::Parameter<std::string> mappingFile{"mapping file", "", this};
68  /// file with query parameters
69  ///
70  /// Required for obs files in the ODB format, unused otherwise.
71  oops::Parameter<std::string> queryFile{"query file", "", this};
72 };
73 
75  OOPS_CONCRETE_PARAMETERS(ObsFileOutParameters, ObsIoParametersBase)
76 
77  public:
78  /// output obs file name
79  oops::RequiredParameter<std::string> fileName{"obsfile", this};
80 };
81 
82 class ObsExtendParameters : public oops::Parameters {
83  OOPS_CONCRETE_PARAMETERS(ObsExtendParameters, oops::Parameters)
84 
85  public:
86  /// Number of model levels onto which original profiles are averaged.
87  oops::RequiredParameter<int> numModelLevels{"average profiles onto model levels", this};
88 
89  /// Variables that are filled with non-missing values when producing averaged profiles.
90  oops::Parameter<std::vector<std::string>> nonMissingExtendedVars
91  {"variables filled with non-missing values",
92  { "latitude", "longitude", "datetime", "air_pressure",
93  "air_pressure_levels", "station_id" },
94  this};
95 };
96 
98  OOPS_ABSTRACT_PARAMETERS(ObsGenerateParametersBase, ObsIoParametersBase)
99 
100  public:
101  /// obs error estimates
102  oops::Parameter<std::vector<float>> obsErrors{"obs errors", { }, this};
103 };
104 
105 class EmbeddedObsGenerateRandomParameters : public oops::Parameters {
106  OOPS_CONCRETE_PARAMETERS(EmbeddedObsGenerateRandomParameters, Parameters)
107 
108  public:
109  /// number of observations
110  oops::RequiredParameter<int> numObs{"nobs", this};
111 
112  /// latitude range start
113  oops::RequiredParameter<float> latStart{"lat1", this};
114 
115  /// latitude range end
116  oops::RequiredParameter<float> latEnd{"lat2", this};
117 
118  /// longitude range start
119  oops::RequiredParameter<float> lonStart{"lon1", this};
120 
121  /// longitude range end
122  oops::RequiredParameter<float> lonEnd{"lon2", this};
123 
124  /// random seed
125  oops::OptionalParameter<int> ranSeed{"random seed", this};
126 };
127 
128 /// Options controlling the ObsIoGenerateRandom class
130  OOPS_CONCRETE_PARAMETERS(ObsGenerateRandomParameters, ObsGenerateParametersBase)
131 
132  public:
133  /// options shared by this class and the legacy implementation (LegacyObsGenerateParameters)
135 };
136 
137 class EmbeddedObsGenerateListParameters : public oops::Parameters {
138  OOPS_CONCRETE_PARAMETERS(EmbeddedObsGenerateListParameters, Parameters)
139 
140  public:
141  /// latitude values
142  oops::RequiredParameter<std::vector<float>> lats{"lats", this};
143 
144  /// longitude values
145  oops::RequiredParameter<std::vector<float>> lons{"lons", this};
146 
147  /// datetime values
148  oops::RequiredParameter<std::vector<std::string>> datetimes{"datetimes", this};
149 };
150 
151 /// Options controlling the ObsIoGenerateList class
153  OOPS_CONCRETE_PARAMETERS(ObsGenerateListParameters, ObsGenerateParametersBase)
154 
155  public:
156  /// options shared by this class and the legacy implementation (LegacyObsGenerateParameters)
158 };
159 
160 /// \brief Options in the 'generate' YAML section.
161 ///
162 /// \note If you add or remove any Parameter member variables from this class, be sure to update
163 /// ObsTopLevelParameters::deserialize() to match.
164 class LegacyObsGenerateParameters : public oops::Parameters {
165  OOPS_CONCRETE_PARAMETERS(LegacyObsGenerateParameters, Parameters)
166 
167  public:
168  /// specification for generating using the random method
169  oops::OptionalParameter<EmbeddedObsGenerateRandomParameters> random{"random", this};
170 
171  /// specification for generating using the list method
172  oops::OptionalParameter<EmbeddedObsGenerateListParameters> list{"list", this};
173 
174  /// options controlling obs record grouping
175  oops::Parameter<ObsGroupingParameters> obsGrouping{"obsgrouping", { }, this};
176 
177  /// obs error estimates
178  oops::Parameter<std::vector<float>> obsErrors{"obs errors", { }, this};
179 
180  /// maximum frame size
181  oops::Parameter<int> maxFrameSize{"max frame size", DEFAULT_FRAME_SIZE, this};
182 };
183 
184 class ObsIoParametersWrapper : public oops::Parameters {
185  OOPS_CONCRETE_PARAMETERS(ObsIoParametersWrapper, Parameters)
186  public:
187  oops::RequiredPolymorphicParameter<ObsIoParametersBase, ObsIoFactory>
188  obsIoInParameters{"type", this};
189 };
190 
191 class ObsTopLevelParameters : public oops::ObsSpaceParametersBase {
192  OOPS_CONCRETE_PARAMETERS(ObsTopLevelParameters, ObsSpaceParametersBase)
193 
194  public:
195  /// Reimplemented to store contents of the `obsdatain` or `generate` section (if present)
196  /// in the source member variable. This makes it possible for the options related to the source
197  /// of input data to be accessed in a uniform way (regardless of in which section they were
198  /// specified) by calling obsIoInParameters().
199  void deserialize(util::CompositePath &path, const eckit::Configuration &config) override;
200 
201  /// name of obs space
202  oops::RequiredParameter<std::string> obsSpaceName{"name", this};
203 
204  /// name of MPI distribution
205  oops::Parameter<std::string> distName{"distribution", "RoundRobin", this};
206 
207  /// If saveObsDistribution/"save obs distribution" set to true,
208  /// global location indices and record numbers will be stored
209  /// in the MetaData/saved_index and MetaData/saved_record_number variables, respectively.
210  /// These variables will be saved along with all other variables
211  /// to the output files generated if the obsdataout.obsfile option is set.
212  ///
213  /// When the "obsdatain.read obs from separate file" option is set
214  /// and hence each process reads a separate input file,
215  /// the presence of these variables makes it possible
216  /// to identify observations stored in more than one input file.
217 
218  oops::Parameter<bool> saveObsDistribution{"save obs distribution", false, this};
219 
220  /// simulated variables
221  oops::RequiredParameter<oops::Variables> simVars{"simulated variables", this};
222 
223  /// Simulated variables whose observed values may be absent from the input file, but must be
224  /// created (computed) by the start of the data assimilation stage.
225  oops::Parameter<oops::Variables> derivedSimVars{"derived simulated variables", {}, this};
226 
227  /// Halo distribution center
228  oops::OptionalParameter<std::vector<float>> haloCenter{"center", this};
229 
230  /// Halo distribution radius
231  oops::OptionalParameter<float> haloRadius{"radius", this};
232 
233  /// output specification by writing to a file
234  oops::OptionalParameter<ObsFileOutParameters> obsOutFile{"obsdataout", this};
235 
236  /// extend the ObsSpace with extra fixed-size records
237  oops::OptionalParameter<ObsExtendParameters> obsExtend{"extension", this};
238 
239  /// parameters indicating where to load data from
241  if (source.value() != boost::none)
242  return source.value()->obsIoInParameters.value();
243  throw eckit::BadValue("obsIoInParameters() must not be called before deserialize()", Here());
244  }
245 
246  private:
247  /// \brief Fill this section to read observations from a file.
248  oops::OptionalParameter<ObsFileInParameters> obsInFile{"obsdatain", this};
249 
250  /// \brief Fill this section to generate observations on the fly.
251  oops::OptionalParameter<LegacyObsGenerateParameters> obsGenerate{"generate", this};
252 
253  /// \brief Fill this section instead of `obsdatain` and `generate` to load observations from
254  /// any other source.
255  oops::OptionalParameter<ObsIoParametersWrapper> source{"source", this};
256 };
257 
259  public:
260  /// sub groups of parameters
262 
263  /// Constructor
265  const util::DateTime & winStart, const util::DateTime & winEnd,
266  const eckit::mpi::Comm & comm, const eckit::mpi::Comm & timeComm) :
267  top_level_(topLevelParams),
268  win_start_(winStart), win_end_(winEnd), comm_(comm),
270  new_dims_(), max_var_size_(0) {
271  // Record the MPI rank number. The rank number is being saved during the
272  // construction of the Parameters for the ObsSpace saveToFile routine.
273  // (saveToFile will uniquify the output file name by tagging on the MPI rank
274  // number) For some reason, querying the saved MPI communicator (comm_) during
275  // the deconstruction process (when saveToFile is being run) will not reliably
276  // return the correct rank number. It was attempted to put in an MPI barrier call
277  // in case the issue was one rank finishing up before the other got to the query, but
278  // the barrier command itself caused a crash. It appears that the saved MPI
279  // communicator is getting corrupted during the deconstruction, but this has not
280  // been fully debugged, and should therefore be looked at later.
281  mpi_rank_ = comm.rank();
282  if (timeComm.size() > 1) {
283  mpi_time_rank_ = timeComm.rank();
284  } else {
285  mpi_time_rank_ = -1;
286  }
287  }
288 
289  /// \brief return the start of the DA timing window
290  const util::DateTime & windowStart() const {return win_start_;}
291 
292  /// \brief return the end of the DA timing window
293  const util::DateTime & windowEnd() const {return win_end_;}
294 
295  /// \brief return the associated MPI group communicator
296  const eckit::mpi::Comm & comm() const {return comm_;}
297 
298  /// \brief return the associated perturbations seed
299  int obsPertSeed() const {return top_level_.obsPerturbationsSeed;}
300 
301  /// \brief return the associated MPI time communicator
302  const eckit::mpi::Comm & timeComm() const {return time_comm_;}
303 
304  /// \brief set a new dimension scale
305  void setDimScale(const std::string & dimName, const Dimensions_t curSize,
306  const Dimensions_t maxSize, const Dimensions_t chunkSize) {
307  new_dims_.push_back(
308  NewDimensionScale<int>(dimName, curSize, maxSize, chunkSize));
309  }
310 
311  /// \brief get a new dimension scale
313 
314  /// \brief set the maximum variable size
315  void setMaxVarSize(const Dimensions_t maxVarSize) { max_var_size_ = maxVarSize; }
316 
317  /// \brief get the maximum variable size
318  Dimensions_t getMaxVarSize() const { return max_var_size_; }
319 
320  /// \brief get the MPI rank number
321  std::size_t getMpiRank() const { return mpi_rank_; }
322 
323  /// \brief get the MPI rank number
324  int getMpiTimeRank() const { return mpi_time_rank_; }
325 
326  private:
327  /// \brief Beginning of DA timing window
328  const util::DateTime win_start_;
329 
330  /// \brief End of DA timing window
331  const util::DateTime win_end_;
332 
333  /// \brief MPI group communicator
334  const eckit::mpi::Comm & comm_;
335 
336  /// \brief MPI time communicator
337  const eckit::mpi::Comm & time_comm_;
338 
339  /// \brief new dimension scales for output file construction
341 
342  /// \brief maximum variable size for output file contruction
343  Dimensions_t max_var_size_;
344 
345  /// \brief group MPI rank number for output file construction
346  std::size_t mpi_rank_;
347 
348  /// \brief time MPI rank number of output file construction
350 };
351 
352 } // namespace ioda
353 
354 #endif // OBSSPACEPARAMETERS_H_
Convenience classes for constructing ObsSpaces and setting up new Dimension Scales.
Describe the dimensions of a ioda::Attribute or ioda::Variable.
oops::RequiredParameter< std::vector< float > > lats
latitude values
oops::RequiredParameter< std::vector< std::string > > datetimes
datetime values
oops::RequiredParameter< std::vector< float > > lons
longitude values
oops::RequiredParameter< float > latEnd
latitude range end
oops::RequiredParameter< float > lonStart
longitude range start
oops::RequiredParameter< float > latStart
latitude range start
oops::OptionalParameter< int > ranSeed
random seed
oops::RequiredParameter< float > lonEnd
longitude range end
oops::RequiredParameter< int > numObs
number of observations
Options in the 'generate' YAML section.
oops::Parameter< std::vector< float > > obsErrors
obs error estimates
oops::Parameter< ObsGroupingParameters > obsGrouping
options controlling obs record grouping
oops::OptionalParameter< EmbeddedObsGenerateRandomParameters > random
specification for generating using the random method
oops::OptionalParameter< EmbeddedObsGenerateListParameters > list
specification for generating using the list method
oops::Parameter< int > maxFrameSize
maximum frame size
oops::Parameter< std::vector< std::string > > nonMissingExtendedVars
Variables that are filled with non-missing values when producing averaged profiles.
oops::RequiredParameter< int > numModelLevels
Number of model levels onto which original profiles are averaged.
oops::Parameter< FileFormat > format
oops::Parameter< std::string > queryFile
oops::Parameter< std::string > mappingFile
oops::Parameter< bool > readFromSeparateFiles
oops::RequiredParameter< std::string > fileName
input obs file name
oops::RequiredParameter< std::string > fileName
output obs file name
Options controlling the ObsIoGenerateList class.
EmbeddedObsGenerateListParameters list
options shared by this class and the legacy implementation (LegacyObsGenerateParameters)
oops::Parameter< std::vector< float > > obsErrors
obs error estimates
Options controlling the ObsIoGenerateRandom class.
EmbeddedObsGenerateRandomParameters random
options shared by this class and the legacy implementation (LegacyObsGenerateParameters)
Base of classes storing the configuration parameters of ObsIo subclasses.
oops::RequiredPolymorphicParameter< ObsIoParametersBase, ObsIoFactory > obsIoInParameters
const eckit::mpi::Comm & time_comm_
MPI time communicator.
int obsPertSeed() const
return the associated perturbations seed
NewDimensionScales_t new_dims_
new dimension scales for output file construction
int getMpiTimeRank() const
get the MPI rank number
const util::DateTime & windowEnd() const
return the end of the DA timing window
void setMaxVarSize(const Dimensions_t maxVarSize)
set the maximum variable size
ObsTopLevelParameters top_level_
sub groups of parameters
std::size_t mpi_rank_
group MPI rank number for output file construction
std::size_t getMpiRank() const
get the MPI rank number
NewDimensionScales_t getDimScales() const
get a new dimension scale
const util::DateTime win_start_
Beginning of DA timing window.
const eckit::mpi::Comm & comm_
MPI group communicator.
void setDimScale(const std::string &dimName, const Dimensions_t curSize, const Dimensions_t maxSize, const Dimensions_t chunkSize)
set a new dimension scale
Dimensions_t getMaxVarSize() const
get the maximum variable size
int mpi_time_rank_
time MPI rank number of output file construction
const eckit::mpi::Comm & timeComm() const
return the associated MPI time communicator
const util::DateTime & windowStart() const
return the start of the DA timing window
const eckit::mpi::Comm & comm() const
return the associated MPI group communicator
const util::DateTime win_end_
End of DA timing window.
ObsSpaceParameters(const ObsTopLevelParameters &topLevelParams, const util::DateTime &winStart, const util::DateTime &winEnd, const eckit::mpi::Comm &comm, const eckit::mpi::Comm &timeComm)
Constructor.
Dimensions_t max_var_size_
maximum variable size for output file contruction
oops::OptionalParameter< ObsFileInParameters > obsInFile
Fill this section to read observations from a file.
oops::OptionalParameter< float > haloRadius
Halo distribution radius.
oops::OptionalParameter< LegacyObsGenerateParameters > obsGenerate
Fill this section to generate observations on the fly.
oops::RequiredParameter< oops::Variables > simVars
simulated variables
void deserialize(util::CompositePath &path, const eckit::Configuration &config) override
oops::OptionalParameter< ObsIoParametersWrapper > source
Fill this section instead of obsdatain and generate to load observations from any other source.
oops::OptionalParameter< std::vector< float > > haloCenter
Halo distribution center.
oops::OptionalParameter< ObsExtendParameters > obsExtend
extend the ObsSpace with extra fixed-size records
oops::RequiredParameter< std::string > obsSpaceName
name of obs space
oops::Parameter< bool > saveObsDistribution
oops::OptionalParameter< ObsFileOutParameters > obsOutFile
output specification by writing to a file
oops::Parameter< oops::Variables > derivedSimVars
oops::Parameter< std::string > distName
name of MPI distribution
const ObsIoParametersBase & obsIoInParameters() const
parameters indicating where to load data from
std::vector< std::shared_ptr< NewDimensionScale_Base > > NewDimensionScales_t
constexpr int DEFAULT_FRAME_SIZE