IODA
IodaUtils.h
Go to the documentation of this file.
1 /*
2  * (C) Copyright 2018-2019 UCAR
3  *
4  * This software is licensed under the terms of the Apache Licence Version 2.0
5  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
6  */
7 
8 #ifndef CORE_IODAUTILS_H_
9 #define CORE_IODAUTILS_H_
10 
11 #include <map>
12 #include <string>
13 #include <typeinfo>
14 #include <utility>
15 #include <vector>
16 
17 #include "eckit/config/LocalConfiguration.h"
18 
19 #include "ioda/Misc/Dimensions.h"
20 #include "ioda/ObsGroup.h"
22 
23 #include "oops/util/abor1_cpp.h"
24 #include "oops/util/DateTime.h"
25 #include "oops/util/Duration.h"
26 #include "oops/util/missingValues.h"
27 
28 
29 namespace ioda {
30  class ObsSpaceParameters;
31 
32  /// \brief typedef for holding list of variable names with associated variable object
33  typedef std::vector<std::pair<std::string, Variable>> VarNameObjectList;
34 
35  /// \brief typedef for holding dim names attached to variables
36  typedef std::map<std::string, std::vector<std::string>> VarDimMap;
37 
38  // Utilities for converting back and forth between vector of strings and
39  // a 2D character array.
40  std::vector<std::size_t> CharShapeFromStringVector(
41  const std::vector<std::string> & StringVector);
42 
43  std::vector<std::string> CharArrayToStringVector(const char * CharData,
44  const std::vector<std::size_t> & CharShape);
45 
46  void StringVectorToCharArray(const std::vector<std::string> & StringVector,
47  const std::vector<std::size_t> & CharShape, char * CharData);
48 
49  std::size_t FindMaxStringLength(const std::vector<std::string> & StringVector);
50  std::string TypeIdName(const std::type_info & TypeId);
51 
52  /// \brief form full variable name given individual group and variable names
53  /// \details This routine will form the consistent frontend variable name according
54  // to the layout policy. This is defined as "groupName/varName".
55  /// \param groupName name of group
56  /// \param varName name of variable
57  std::string fullVarName(const std::string & groupName, const std::string & varName);
58 
59  /// \brief collect variable and dimension information from a ioda ObsGroup
60  /// \details It is assumed that the input ObsGroup has been populated. For example
61  /// you open an existing hdf5 file, and then call this routing to collect
62  /// the information. The information collected is passed back through the
63  /// output parameters (last 4 parameters) of this routine.
64  ///
65  /// The reason for collecting all of this information in a single routine is
66  /// to handle severe performance issues with the HDF5 library when inspecting
67  /// an ObsGroup based on an HDF5 backend.
68  ///
69  /// \param obsGroup ioda ObsGroup object
70  /// \param varObjectList list of regular variable names with associated Variable objects
71  /// \param dimVarObjectList list of dimension variable names with associated Variable objects
72  /// \param dimsAttachedToVars map structure holding list of dimension scale names attached
73  /// each regular variable
74  /// \param maxVarSize0 maximum var length along the first (0th) dimension
75  void collectVarDimInfo(const ObsGroup & obsGroup, VarNameObjectList & varObjectList,
76  VarNameObjectList & dimVarObjectList, VarDimMap & dimsAttachedToVars,
77  Dimensions_t & maxVarSize0);
78 
79  /// \brief get variable data type
80  std::type_index varDtype(const Group & group, const std::string & varName);
81 
82  /// \brief true if variable is a dimension scale
83  bool varIsDimScale(const Group & group, const std::string & varName);
84 
85  /// \brief convert reference, time to DateTime object
86  /// \param refDtime reference date time
87  /// \param timeOffets offset time values (in hours)
88  std::vector<util::DateTime> convertRefOffsetToDtime(const int refIntDtime,
89  const std::vector<float> & timeOffsets);
90 
91  /// \brief convert datetime strings to DateTime object
92  /// \param dtStrings datetime strings
93  std::vector<util::DateTime> convertDtStringsToDtime(const std::vector<std::string> & dtStrings);
94 
95  /// \brief convert 2D string array to a vector of strings
96  /// \details The incoming 2D strings array is passed in through the arrayData argument
97  /// as a flattened vector. The arrayShape arugument shows how to un-flatten the arrayData.
98  /// \param arrayData Flattened data for input 2D string array
99  /// \param arrayShape Shape of input arrayData
100  std::vector<std::string> StringArrayToStringVector(
101  const std::vector<std::string> & arrayData,
102  const std::vector<Dimensions_t> & arrayShape);
103 
104  /// \brief set params for output file construction from test YAML configuration
105  /// \details This routine is intended for use by the ObsIo and ObsFrame tests. It
106  /// relies on test confiruation "test data.write dimensions" and
107  /// "test data.write variables" accompanying an "obsdataout.obsfile" spec in the
108  /// YAML configuration.
109  /// \param obsConfig test YAML configuration for and ObsSpace
110  /// \param obsParams output params
111  void setOfileParamsFromTestConfig(const eckit::LocalConfiguration & obsConfig,
112  ioda::ObsSpaceParameters & obsParams);
113 
114  /// \brief uniquify the output file name
115  /// \details This function will tag on the MPI task number to the end of the file name
116  /// to avoid collisions when running with multiple MPI tasks.
117  /// \param fileName raw output file name
118  /// \param rankNum MPI group communicator rank number
119  /// \param timeRankNum MPI time communicator rank number
120  std::string uniquifyFileName(const std::string & fileName, const std::size_t rankNum,
121  const int timeRankNum);
122 
123  /// \brief form a map containing lists of dimension variables that are attached to each
124  /// variable
125  /// \param varContainer Has_Variables object with variables to check
126  /// \param varList list of regular variables
127  /// \param dimVarList list of dimension scale variables
129  const std::vector<std::string> & varList,
130  const std::vector<std::string> & dimVarList);
131 
132  /// \brief convert the new format varible name to the old format
133  /// \param varName new format variable name
134  std::string convertNewVnameToOldVname(const std::string & varName);
135 
136  // -----------------------------------------------------------------------------
137  /*!
138  * \details This method will perform numeric data type conversions. This method is aware
139  * of the IODA missing values and will convert these appropriately. For
140  * example when converting double to float, all double missing values will
141  * be replaced with float missing values during the conversion.
142  *
143  * \param[in] FromVar Vector of variable we are converting from
144  * \param[out] ToVar Vector of variable we are converting to
145  * \param[in] VarSize Total number of elements in FromVar and ToVar.
146  */
147  template<typename FromType, typename ToType>
148  void ConvertVarType(const std::vector<FromType> & FromVar, std::vector<ToType> & ToVar) {
149  ToVar.resize(FromVar.size());
150 
151  std::string FromTypeName = TypeIdName(typeid(FromType));
152  std::string ToTypeName = TypeIdName(typeid(ToType));
153  const FromType FromMiss = util::missingValue(FromMiss);
154  const ToType ToMiss = util::missingValue(ToMiss);
155 
156  // In any type change, the missing values need to be switched.
157  //
158  // Allow type changes between numeric types (int, float, double). These can
159  // be handled with the standard conversions.
160  bool FromTypeOkay = ((typeid(FromType) == typeid(int)) ||
161  (typeid(FromType) == typeid(float)) ||
162  (typeid(FromType) == typeid(double)));
163 
164  bool ToTypeOkay = ((typeid(ToType) == typeid(int)) ||
165  (typeid(ToType) == typeid(float)) ||
166  (typeid(ToType) == typeid(double)));
167 
168  if (FromTypeOkay && ToTypeOkay) {
169  for (std::size_t i = 0; i < FromVar.size(); i++) {
170  if (FromVar[i] == FromMiss) {
171  ToVar[i] = ToMiss;
172  } else {
173  ToVar[i] = static_cast<ToType>(FromVar[i]);
174  }
175  }
176  } else {
177  std::string ErrorMsg = "Unsupported variable data type conversion: " +
178  FromTypeName + " to " + ToTypeName;
179  ABORT(ErrorMsg);
180  }
181  }
182 } // namespace ioda
183 
184 #endif // CORE_IODAUTILS_H_
Describe the dimensions of a ioda::Attribute or ioda::Variable.
Interfaces for ioda::ObsGroup and related classes.
Interfaces for ioda::Variable and related classes.
Groups are a new implementation of ObsSpaces.
Definition: Group.h:159
This class exists inside of ioda::Group and provides the interface to manipulating Variables.
An ObsGroup is a specialization of a ioda::Group. It provides convenience functions and guarantees th...
Definition: ObsGroup.h:32
void StringVectorToCharArray(const std::vector< std::string > &StringVector, const std::vector< std::size_t > &CharShape, char *CharData)
Definition: IodaUtils.cc:70
std::vector< std::size_t > CharShapeFromStringVector(const std::vector< std::string > &StringVector)
Definition: IodaUtils.cc:20
std::vector< std::pair< std::string, Variable > > VarNameObjectList
typedef for holding list of variable names with associated variable object
Definition: IodaUtils.h:30
std::string fullVarName(const std::string &groupName, const std::string &varName)
form full variable name given individual group and variable names
Definition: IodaUtils.cc:120
void ConvertVarType(const std::vector< FromType > &FromVar, std::vector< ToType > &ToVar)
Definition: IodaUtils.h:148
VarDimMap genDimsAttachedToVars(const Has_Variables &varContainer, const std::vector< std::string > &varList, const std::vector< std::string > &dimVarList)
form a map containing lists of dimension variables that are attached to each variable
std::map< std::string, std::vector< std::string > > VarDimMap
typedef for holding dim names attached to variables
Definition: IodaUtils.h:36
std::type_index varDtype(const Group &group, const std::string &varName)
get variable data type
Definition: IodaUtils.cc:221
std::vector< std::string > CharArrayToStringVector(const char *CharData, const std::vector< std::size_t > &CharShape)
Definition: IodaUtils.cc:36
std::string uniquifyFileName(const std::string &fileName, const std::size_t rankNum, const int timeRankNum)
uniquify the output file name
Definition: IodaUtils.cc:343
void collectVarDimInfo(const ObsGroup &obsGroup, VarNameObjectList &varObjectList, VarNameObjectList &dimVarObjectList, VarDimMap &dimsAttachedToVars, Dimensions_t &maxVarSize0)
collect variable and dimension information from a ioda ObsGroup
Definition: IodaUtils.cc:125
std::vector< util::DateTime > convertRefOffsetToDtime(const int refIntDtime, const std::vector< float > &timeOffsets)
convert reference, time to DateTime object
Definition: IodaUtils.cc:251
bool varIsDimScale(const Group &group, const std::string &varName)
true if variable is a dimension scale
Definition: IodaUtils.cc:233
std::size_t FindMaxStringLength(const std::vector< std::string > &StringVector)
Definition: IodaUtils.cc:109
std::string TypeIdName(const std::type_info &TypeId)
Definition: IodaUtils.cc:89
void setOfileParamsFromTestConfig(const eckit::LocalConfiguration &obsConfig, ioda::ObsSpaceParameters &obsParams)
set params for output file construction from test YAML configuration
Definition: IodaUtils.cc:306
std::vector< util::DateTime > convertDtStringsToDtime(const std::vector< std::string > &dtStrings)
convert datetime strings to DateTime object
Definition: IodaUtils.cc:239
std::string convertNewVnameToOldVname(const std::string &varName)
convert the new format varible name to the old format
Definition: IodaUtils.cc:365
std::vector< std::string > StringArrayToStringVector(const std::vector< std::string > &arrayData, const std::vector< Dimensions_t > &arrayShape)
convert 2D string array to a vector of strings
Definition: IodaUtils.cc:274