IODA
HH-util.cpp
Go to the documentation of this file.
1 /*
2  * (C) Copyright 2020-2021 UCAR
3  *
4  * This software is licensed under the terms of the Apache Licence Version 2.0
5  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
6  */
7 /*! \addtogroup ioda_internals_engines_hh
8  *
9  * @{
10  * \file HH-util.cpp
11  * \brief HDF5 utility functions.
12  */
13 
14 #include "./HH/HH-util.h"
15 
16 #include <hdf5_hl.h>
17 #include <algorithm>
18 #include <iterator>
19 #include <string>
20 #include <utility>
21 #include <vector>
22 
23 #include "./HH/Handles.h"
24 #include "./HH/HH-attributes.h"
25 #include "./HH/HH-variables.h"
26 #include "ioda/Exception.h"
27 
28 namespace ioda {
29 namespace detail {
30 namespace Engines {
31 namespace HH {
32 
33  /// Callback function for H5Aiterate / H5Aiterate2 / H5Aiterate1.
34 #if H5_VERSION_GE(1, 8, 0)
35 herr_t iterate_find_attr(hid_t loc_id, const char* name, const H5A_info_t* info, void* op_data) {
36 #else
37 herr_t iterate_find_attr(hid_t loc_id, const char* name, void* op_data) {
38  H5A_info_t in_info;
39  H5Aget_info_by_name(loc_id, ".", name, &in_info, H5P_DEFAULT);)
40  H5A_info_t* info = &in_info;
41 #endif
42 
44  = (Iterator_find_attr_data_t*)op_data; // NOLINT: HDF5 mandates that op_data be void*.
45 
46  if (name == nullptr) return -1;
47  if (std::string(name) == op->search_for) {
48  op->success = true;
49  return 1;
50  }
51  op->idx++;
52  return 0;
53 }
54 
55 H5_index_t getAttrCreationOrder(hid_t obj, H5O_type_t objType) {
56  if (objType != H5O_TYPE_DATASET && objType != H5O_TYPE_GROUP)
57  throw Exception("Invalid object type", ioda_Here());
58  // Apparently files do not have a creation plist. They show up as groups,
59  // so we catch this and return H5_INDEX_NAME.
60  if (objType == H5O_TYPE_GROUP) {
61  H5I_type_t typ = H5Iget_type(obj); // NOLINT
62  if (typ < 0) throw Exception("Error determining object type", ioda_Here());
63  if (typ == H5I_FILE) return H5_INDEX_NAME; // NOLINT
64  }
65 
66  unsigned crt_order_flags = 0;
67  hid_t hcreatepl
68  = (objType == H5O_TYPE_DATASET) ? H5Dget_create_plist(obj) : H5Gget_create_plist(obj);
70 
71  if (createpl() < 0) throw Exception("Cannot get creation property list", ioda_Here());
72  if (0 > H5Pget_attr_creation_order(createpl(), &crt_order_flags))
73  throw Exception("Cannot get attribute creation order", ioda_Here());
74  // We only care if this property is tracked. Indexing is performed on the fly
75  // if it is not available (and incurs a read penalty), but this has performance of
76  // at least ordering by name.
77  return (crt_order_flags & H5P_CRT_ORDER_TRACKED) // NOLINT
78  ? H5_INDEX_CRT_ORDER
79  : H5_INDEX_NAME;
80 }
81 
82 std::pair<bool, hsize_t> iterativeAttributeSearch(hid_t baseObject, const char* attname, H5_index_t iteration_type) {
83 
84  // H5Aiterate2 exists in v1.8 and up.
85  hsize_t pos = 0;
87  opts.search_for = std::string(attname);
88  herr_t append_ret
89  = H5Aiterate2(baseObject, // Search on this dataset
90  iteration_type, // Iterate by name or creation order
91  H5_ITER_NATIVE, // Fastest ordering possible
92  &pos, // Initial (and current) index
93  iterate_find_attr, // C-style search function
94  reinterpret_cast<void*>(&opts) // Data passed to/from the C-style search function
95  );
96  if (append_ret < 0) return std::pair<bool, hsize_t>(false, -2);
97  return std::pair<bool, hsize_t>(opts.success, opts.idx);
98 }
99 
100 HH_Attribute iterativeAttributeSearchAndOpen(hid_t baseObject, H5O_type_t objType,
101  const char* attname) {
102  // Get search order
103  H5_index_t iteration_type = getAttrCreationOrder(baseObject, objType);
104  auto searchres = iterativeAttributeSearch(baseObject, attname, iteration_type);
105  bool searchSuccess = searchres.first;
106  hsize_t idx = searchres.second;
107 
108  HH_Attribute aDims_HH;
109  // Either create the attribute and set its initial data or open the attribute and append.
110  if (searchSuccess) {
111  // Open attribute and read data
112  hid_t found_att = H5Aopen_by_idx(baseObject, ".", iteration_type, H5_ITER_NATIVE, idx,
113  H5P_DEFAULT, H5P_DEFAULT);
114  if (found_att < 0) throw Exception("Cannot open attribute by index", ioda_Here());
115  aDims_HH
117  } else {
118  aDims_HH
119  = HH_Attribute(HH_hid_t());
120  }
121 
122  return aDims_HH;
123 }
124 
125 
126 void attr_update_dimension_list(HH_Variable* var, const std::vector<std::vector<ref_t>>& new_dim_list) {
127  hid_t var_id = var->get()();
128 
129  auto dims = var->getDimensions();
130  // dimension of the "DIMENSION_LIST" array
131  hsize_t hdims[1] = {gsl::narrow<hsize_t>(dims.dimensionality)};
132  // The attribute's dataspace
134  if ((sid = H5Screate_simple(1, hdims, NULL)).get() < 0)
135  throw Exception("Cannot create simple dataspace.", ioda_Here());
136  // The attribute's datatype
138  if ((tid = H5Tvlen_create(H5T_STD_REF_OBJ)).get() < 0)
139  throw Exception("Cannot create variable length array type.", ioda_Here());
140  // Check if the DIMENSION_LIST attribute exists.
141  HH_Attribute aDimList = iterativeAttributeSearchAndOpen(var_id, H5O_TYPE_DATASET, DIMENSION_LIST);
142  // If the DIMENSION_LIST attribute does not exist, create it.
143  // If it exists, read it.
144  using std::vector;
145  vector<hvl_t> dimlist_in_data(dims.dimensionality);
146  if (!aDimList.get().isValid()) {
147  // Create
148  hid_t aid = H5Acreate(var_id, DIMENSION_LIST, tid(), sid(), H5P_DEFAULT, H5P_DEFAULT);
149  if (aid < 0) throw Exception("Cannot create attribute", ioda_Here());
150 
152  // Initialize dimlist_in_data to nulls. Used in merge operation later.
153  for (auto & d : dimlist_in_data) {
154  d.len = 0;
155  d.p = nullptr;
156  }
157  } else {
158  // Read
159  if (H5Aread(aDimList.get()(), tid(), static_cast<void*>(dimlist_in_data.data())) < 0)
160  throw Exception("Cannot read attribute", ioda_Here());
161  }
162 
163  // Allocate a new list that combines any previous DIMENSION_LIST with ref_axis.
164  vector<hvl_t> dimlist_out_data(dims.dimensionality);
165  // Merge the new allocations with any previous DIMENSION_LIST entries.
166  // NOTE: Memory is explicitly freed at the end of the function. Since we are
167  // using pure C function calls, throws will not happen even if we run out of memory.
168  for (size_t dim = 0; dim < gsl::narrow<size_t>(dims.dimensionality); ++dim) {
169  View_hvl_t<hobj_ref_t> olddims(dimlist_in_data[dim]);
170  const std::vector<ref_t>& newdims = new_dim_list[dim];
171  View_hvl_t<hobj_ref_t> outdims(dimlist_out_data[dim]);
172 
173  // TODO(ryan)!!!!!
174  // When merging, check if any references are equal.
175  // Given our intended usage of this function, this may never happen.
176 
177  // Note the names here. old + new = out;
178  outdims.resize(olddims.size() + newdims.size());
179  for (size_t i = 0; i < olddims.size(); ++i) {
180  *outdims[i] = *olddims[i];
181  }
182  for (size_t i = 0; i < newdims.size(); ++i) {
183  *outdims[i + olddims.size()] = newdims[i];
184  }
185  }
186 
187  // Write the new list. Deallocate the "old" lists after write, and then check for any errors.
188  // Pure C code in between, so the deallocation always occurs.
189  herr_t write_success = H5Awrite(aDimList.get()(), tid(), static_cast<void*>(dimlist_out_data.data()));
190 
191  // Deallocate old memory
192  H5Dvlen_reclaim(tid.get(), sid.get(), H5P_DEFAULT, reinterpret_cast<void*>(dimlist_in_data.data()));
193  for (size_t dim = 0; dim < gsl::narrow<size_t>(dims.dimensionality); ++dim) {
194  View_hvl_t<hobj_ref_t> outdims(dimlist_out_data[dim]);
195  // The View_hvl_t is a "view" that allows us to reinterpret dimlist_out_data[dim]
196  // as a sequence of hobj_ref_t objects.
197  // We use the resize method to trigger a deliberate free of held memory
198  // that can result from the above merge step.
199  outdims.resize(0);
200  }
201 
202  if (write_success < 0) throw Exception("Failed to write DIMENSION_LIST.", ioda_Here());
203 }
204 
207  if (!tid.isValid()) {
208  // The attribute's datatype
209  if ((tid = H5Tcreate(H5T_COMPOUND, sizeof(ds_list_t))).get() < 0)
210  throw Exception("Cannot create compound datatype.", ioda_Here());
211  if (H5Tinsert(tid(), "dataset", HOFFSET(ds_list_t, ref), H5T_STD_REF_OBJ) < 0)
212  throw Exception("Cannot create compound datatype.", ioda_Here());
213  if (H5Tinsert(tid(), "dimension", HOFFSET(ds_list_t, dim_idx), H5T_NATIVE_INT) < 0)
214  throw Exception("Cannot create compound datatype.", ioda_Here());
215  }
216  return tid;
217 }
218 
221 
222  // dimension of the "REFERENCE_LIST" array
223  const hsize_t hdims[1] = {numrefs};
224  // The attribute's dataspace
225  if ((sid = H5Screate_simple(1, hdims, NULL)).get() < 0)
226  throw Exception("Cannot create simple dataspace.", ioda_Here());
227  return sid;
228 }
229 
230 void attr_update_reference_list(HH_Variable* scale, const std::vector<ds_list_t>& ref_var_axis) {
231  using std::vector;
233  hid_t scale_id = scale->get()();
234 
235  // The REFERENCE_LIST attribute must be deleted and re-created each time
236  // new references are added.
237  // For the append operation, first check whether the attribute exists.
238  vector<ds_list_t> oldrefs;
239  HH_Attribute aDimListOld
240  = iterativeAttributeSearchAndOpen(scale_id, H5O_TYPE_DATASET, REFERENCE_LIST);
241  if (aDimListOld.get().isValid()) {
242  oldrefs.resize(gsl::narrow<size_t>(aDimListOld.getDimensions().numElements));
243  if (H5Aread(aDimListOld.get()(), type(), oldrefs.data()) < 0)
244  throw Exception("Cannot read REFERENCE_LIST attribute.", ioda_Here());
245  // Release the object handle and delete the attribute.
246  aDimListOld = HH_Attribute();
247  scale->atts.remove(REFERENCE_LIST);
248  }
249 
250  vector<ds_list_t> refs = oldrefs;
251  refs.reserve(ref_var_axis.size() + oldrefs.size());
252  std::copy(ref_var_axis.begin(), ref_var_axis.end(), std::back_inserter(refs));
253 
254  // Create the new REFERENCE_LIST attribute.
255  HH_hid_t sid = attr_reference_list_space(gsl::narrow<hsize_t>(refs.size()));
256  hid_t aid = H5Acreate(scale_id, REFERENCE_LIST, type(), sid(), H5P_DEFAULT, H5P_DEFAULT);
257  if (aid < 0) throw Exception("Cannot create new REFERENCE_LIST attribute.", ioda_Here());
259  if (H5Awrite(newAtt.get()(), type(), static_cast<void*>(refs.data())) < 0)
260  throw Exception("Cannot write REFERENCE_LIST attribute.", ioda_Here());
261 }
262 
263 std::string getNameFromIdentifier(hid_t obj_id) {
264  ssize_t sz = H5Iget_name(obj_id, nullptr, 0);
265  if (sz < 0) throw Exception("Cannot get object name", ioda_Here());
266  std::vector<char> data(sz + 1, 0);
267  ssize_t ret = H5Iget_name(obj_id, data.data(), data.size());
268  if (ret < 0) throw Exception("Cannot get object name", ioda_Here());
269  return std::string(data.data());
270 }
271 
272 } // namespace HH
273 } // namespace Engines
274 } // namespace detail
275 } // namespace ioda
IODA's error system.
HDF5 engine implementation of Attribute.
Utility functions for HDF5.
HDF5 engine implementation of Variable.
HDF5 resource handles in C++.
The ioda exception class.
Definition: Exception.h:54
This is the implementation of Attributes using HDF5.
Definition: HH-attributes.h:30
Dimensions getDimensions() const final
Get Attribute's dimensions.
This is the implementation of Variables using HDF5.
Definition: HH-variables.h:40
Dimensions getDimensions() const final
A class to wrap HDF5's hid_t resource handles.
Definition: Handles.h:92
virtual void remove(const std::string &attname)
Delete an Attribute with the specified name.
Has_Attributes atts
Attributes.
Definition: Variable.h:71
IODA_HIDDEN std::string getNameFromIdentifier(hid_t obj_id)
Gets a variable / group / link name from an id. Useful for debugging.
Definition: HH-util.cpp:263
IODA_HIDDEN std::pair< bool, hsize_t > iterativeAttributeSearch(hid_t baseObject, const char *attname, H5_index_t iteration_type)
Linear search to find an attribute.
Definition: HH-util.cpp:82
HH_hid_t attr_reference_list_space(hsize_t numrefs)
Definition: HH-util.cpp:219
HH_hid_t attr_reference_list_type()
Definition: HH-util.cpp:205
IODA_HIDDEN herr_t iterate_find_attr(hid_t loc_id, const char *name, void *op_data)
Callback function for H5Aiterate / H5Aiterate2 / H5Aiterate1.
Definition: HH-util.cpp:37
IODA_HIDDEN void attr_update_reference_list(HH_Variable *scale, const std::vector< ds_list_t > &ref_var_axis)
Attribute REFERENCE_LIST update function.
Definition: HH-util.cpp:230
IODA_HIDDEN HH_Attribute iterativeAttributeSearchAndOpen(hid_t baseObject, H5O_type_t objType, const char *attname)
Linear search to find and open an attribute, if it exists.
Definition: HH-util.cpp:100
IODA_HIDDEN void attr_update_dimension_list(HH_Variable *var, const std::vector< std::vector< ref_t >> &new_dim_list)
Attribute DIMENSION_LIST update function.
Definition: HH-util.cpp:126
IODA_HIDDEN H5_index_t getAttrCreationOrder(hid_t obj, H5O_type_t objType)
Determine attribute creation order for a dataset.
Definition: HH-util.cpp:55
IODA_DL void copy(const ObjectSelection &from, ObjectSelection &to, const ScaleMapping &scale_map)
Generic data copying function.
Definition: Copying.cpp:63
#define ioda_Here()
Dimensions_t numElements
Definition: Dimensions.h:26
Data to pass to/from iterator classes.
Definition: HH-util.h:48
A "view" of hvl_t objects. Adds C++ conveniences to an otherwise troublesome class.
Definition: HH-util.h:134
Duplicate the HDF5 dataset list structure for REFERENCE_LISTs.
Definition: HH-util.h:42