IODA
Variable.h
Go to the documentation of this file.
1 #pragma once
2 /*
3  * (C) Copyright 2020-2021 UCAR
4  *
5  * This software is licensed under the terms of the Apache Licence Version 2.0
6  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
7  */
8 /*! \defgroup ioda_cxx_variable Variables, Data Access, and Selections
9  * \brief The main data storage methods and objects in IODA.
10  * \ingroup ioda_cxx_api
11  *
12  * @{
13  * \file Variable.h
14  * \brief @link ioda_cxx_variable Interfaces @endlink for ioda::Variable and related classes.
15  */
16 #include <cstring>
17 #include <gsl/gsl-lite.hpp>
18 #include <list>
19 #include <map>
20 #include <memory>
21 #include <string>
22 #include <tuple>
23 #include <utility>
24 #include <vector>
25 
27 #include "ioda/Exception.h"
28 #include "ioda/Misc/Eigen_Compat.h"
29 #include "ioda/Python/Var_ext.h"
30 #include "ioda/Types/Marshalling.h"
31 #include "ioda/Types/Type.h"
33 #include "ioda/Variables/Fill.h"
35 #include "ioda/defs.h"
36 
37 namespace ioda {
38 class Attribute;
39 class Variable;
40 struct VariableCreationParameters;
41 
42 struct Named_Variable;
43 
44 namespace detail {
45 class Attribute_Backend;
46 class Variable_Backend;
47 
48 /// \brief Exists to prevent constructor conflicts when passing a backend into
49 /// a frontend object.
50 /// \ingroup ioda_cxx_variable
51 /// \bug Need to add a virtual resize function.
52 template <class Variable_Implementation = Variable>
54 protected:
55  /// Using an opaque object to implement the backend.
56  std::shared_ptr<Variable_Backend> backend_;
57 
58  /// @name General Functions
59  /// @{
60 
61  Variable_Base(std::shared_ptr<Variable_Backend>);
62 
63 public:
64  virtual ~Variable_Base();
65 
66  /// @}
67  /// @name Metadata manipulation
68  /// @{
69 
70  /// Attributes
72 
73  /// @}
74 
75  /// @name General Functions
76  /// @{
77 
78  /// Gets a handle to the underlying object that implements the backend functionality.
79  std::shared_ptr<Variable_Backend> get() const;
80 
81  /// @}
82  /// @name Type-querying Functions
83  /// @{
84 
85  /// Get type
86  virtual Type getType() const;
87  /// Get type
88  inline Type type() const { return getType(); }
89 
90  /// Query the backend and get the type provider.
91  virtual detail::Type_Provider* getTypeProvider() const;
92 
93  /// \brief Convenience function to check a Variable's storage type.
94  /// \param DataType is the type of the data. I.e. float, int, int32_t, uint16_t, std::string, etc.
95  /// \returns True if the type matches
96  /// \returns False (0) if the type does not match
97  /// \throws jedi::xError if an error occurred.
98  template <class DataType>
99  bool isA() const {
101 
102  return isA(templateType);
103  }
104  /// Hand-off to the backend to check equivalence
105  virtual bool isA(Type lhs) const;
106 
107  /// Python compatability function
108  inline bool isA(BasicTypes dataType) const { return isA(Type(dataType, getTypeProvider())); }
109  /// \internal pybind11
110  inline bool _py_isA2(BasicTypes dataType) { return isA(dataType); }
111  /// Convenience function to query type
113 
114  /// @}
115  /// @name Querying Functions for Fill Values, Chunking and Compression
116  /// @{
117 
118  /// @brief Convenience function to get fill value, attributes,
119  /// chunk sizes, and compression in a collective call.
120  /// @details This function has better performance on some engines
121  /// for bulk operations than calling separately.
122  /// @param doAtts includes attributes in the creation parameters.
123  /// @param doDims includes dimension scales in the creation parameters.
124  /// Although dimensions are attributes on some backends, we treat them
125  /// separately in this function.
126  /// @returns the filled-in VariableCreationParameters object
127  virtual VariableCreationParameters getCreationParameters(bool doAtts = true,
128  bool doDims = true) const;
129 
130  /// \brief Check if a variable has a fill value set
131  /// \returns true if a fill value is set, false otherwise.
132  virtual bool hasFillValue() const;
133 
134  /// Remap fill value storage type into this class.
136 
137  /// \brief Retrieve the fill value
138  /// \returns an object of type FillValueData_t that stores
139  /// the fill value. If there is no fill value, then
140  /// FillValueData_t::set_ will equal false. The fill
141  /// value data will be stored in
142  /// FillValueData_t::fillValue_ (for simple types), or in
143  /// FillValueData_t::stringFillValue_ (for strings only).
144  /// \note Recommend querying isA to make sure that you
145  /// are reading the fill value as the correct type.
146  virtual FillValueData_t getFillValue() const;
147 
148  /// \brief Retrieve the chunking options for the Variable.
149  /// \note Not all backends support chunking, but they should
150  /// all store the desired chunk size information in case the
151  /// Variable is copied to a new backend.
152  /// \returns a vector containing the chunk sizes.
153  /// \returns an empty vector if chunking is not used.
154  virtual std::vector<Dimensions_t> getChunkSizes() const;
155 
156  /// \brief Retrieve the GZIP compression options for the Variable.
157  /// \note Not all backends support compression (and those that
158  /// do also require chunking support). They should store this
159  /// information anyways, in case the Variable is copied to
160  /// a new backend.
161  /// \returns a pair indicating 1) whether GZIP is requested and
162  /// 2) the compression level that is desired.
163  virtual std::pair<bool, int> getGZIPCompression() const;
164 
165  /// \brief Retrieve the SZIP compression options for the Variable.
166  /// \note Not all backends support compression (and those that
167  /// do also require chunking support). They should store this
168  /// information anyways, in case the Variable is copied to
169  /// a new backend.
170  /// \returns a tuple indicating 1) whether SZIP is requested,
171  /// 2) PixelsPerBlock, and 3) general SZIP filter option flags.
172  virtual std::tuple<bool, unsigned, unsigned> getSZIPCompression() const;
173 
174  /// @}
175  /// @name Data Space-Querying Functions
176  /// @{
177 
178  // Get dataspace
179  // JEDI_NODISCARD DataSpace getSpace() const;
180 
181  /// Get current and maximum dimensions, and number of total points.
182  /// \note In Python, see the dims property.
183  virtual Dimensions getDimensions() const;
184 
185  /// \brief Resize the variable.
186  /// \note Not all variables are resizable. This depends
187  /// on backend support. For HDF5, the variable must be chunked
188  /// and must not exceed max_dims.
189  /// \note Bad things may happen if a variable's dimension scales
190  /// have different lengths than its dimensions. Resize them
191  /// together, preferably using the ObsSpace resize function.
192  /// \see ObsSpace::resize
193  /// \param newDims are the new dimensions.
194  virtual Variable resize(const std::vector<Dimensions_t>& newDims);
195 
196  /// Attach a dimension scale to this Variable.
197  virtual Variable attachDimensionScale(unsigned int DimensionNumber, const Variable& scale);
198  /// Detach a dimension scale
199  virtual Variable detachDimensionScale(unsigned int DimensionNumber, const Variable& scale);
200  /// Set dimensions (convenience function to several invocations of attachDimensionScale).
201  Variable setDimScale(const std::vector<Variable>& dims);
202  /// Set dimensions (convenience function to several invocations of attachDimensionScale).
203  Variable setDimScale(const std::vector<Named_Variable>& dims);
204  /// Set dimensions (convenience function to several invocations of attachDimensionScale).
205  Variable setDimScale(const Variable& dims);
206  /// Set dimensions (convenience function to several invocations of attachDimensionScale).
207  Variable setDimScale(const Variable& dim1, const Variable& dim2);
208  /// Set dimensions (convenience function to several invocations of attachDimensionScale).
209  Variable setDimScale(const Variable& dim1, const Variable& dim2, const Variable& dim3);
210 
211  /// Is this Variable used as a dimension scale?
212  virtual bool isDimensionScale() const;
213 
214  /// Designate this table as a dimension scale
215  virtual Variable setIsDimensionScale(const std::string& dimensionScaleName);
216  /// Get the name of this Variable's defined dimension scale
217  inline std::string getDimensionScaleName() const {
218  std::string r;
220  return r;
221  }
222  virtual Variable getDimensionScaleName(std::string& res) const;
223 
224  /// Is a dimension scale attached to this Variable in a certain position?
225  virtual bool isDimensionScaleAttached(unsigned int DimensionNumber, const Variable& scale) const;
226 
227  /// \brief Which dimensions are attached at which positions? This function may offer improved
228  /// performance on some backends compared to serial isDimensionScaleAttached calls.
229  /// \param scalesToQueryAgainst is a vector containing the scales. You can pass in
230  /// "tagged" strings that map the Variable to a name.
231  /// If you do not pass in a scale to check against, then this scale will not be checked and
232  /// will not be present in the function output.
233  /// \param firstOnly is specified when only one dimension can be attached to each axis (the
234  /// default).
235  /// \returns a vector with the same length as the variable's dimensionality.
236  /// Each variable dimension in the vector can have one or more attached scales. These scales are
237  /// returned as their own, inner, vector of pair<string, Variable>.
238  virtual std::vector<std::vector<Named_Variable>> getDimensionScaleMappings(
239  const std::list<Named_Variable>& scalesToQueryAgainst,
240  bool firstOnly = true) const;
241 
242  /// @}
243  /// @name Writing Data
244  /// @{
245 
246  /// \brief The fundamental write function. Backends overload this function to implement
247  /// all write operations.
248  ///
249  /// \details This function writes a span of bytes (characters) to the backend attribute
250  /// storage. No type conversions take place here (see the templated conversion function,
251  /// below).
252  ///
253  /// \param data is a span of data.
254  /// \param in_memory_datatype is an opaque (backend-level) object that describes the
255  /// placement of the data in memory. Usually ignorable - needed for complex data structures.
256  /// \param mem_selection is the user's memory layout representing the location where
257  /// the data is read from.
258  /// \param file_selection is the backend's memory layout representing the
259  /// location where the data are written to.
260  /// \throws ioda::xError if data has the wrong size.
261  /// \returns The variable (for chaining).
262  virtual Variable write(gsl::span<char> data, const Type& in_memory_dataType,
263  const Selection& mem_selection = Selection::all,
264  const Selection& file_selection = Selection::all);
265 
266  /// \brief Write the Variable
267  /// \note Ensure that the correct dimension ordering is preserved.
268  /// \note With default parameters, the entire Variable is written.
269  /// \tparam DataType is the type of the data to be written.
270  /// \tparam Marshaller is a class that serializes / deserializes data.
271  /// \tparam TypeWrapper translates DataType into a form that the backend understands.
272  /// \param data is a span of data.
273  /// \param mem_selection is the user's memory layout representing the location where
274  /// the data is read from.
275  /// \param file_selection is the backend's memory layout representing the
276  /// location where the data are written to.
277  /// \throws ioda::xError if data has the wrong size.
278  /// \returns The variable (for chaining).
279  template <class DataType, class Marshaller = Object_Accessor<DataType>,
280  class TypeWrapper = Types::GetType_Wrapper<DataType>>
281  Variable_Implementation write(const gsl::span<DataType> data,
282  const Selection& mem_selection = Selection::all,
283  const Selection& file_selection = Selection::all) {
284  try {
285  Marshaller m;
286  auto d = m.serialize(data);
287  return write(gsl::make_span<char>(
288  const_cast<char*>(reinterpret_cast<const char*>(d->DataPointers.data())),
289  d->DataPointers.size() * sizeof(typename Marshaller::mutable_value_type)),
290  TypeWrapper::GetType(getTypeProvider()), mem_selection, file_selection);
291  } catch (...) {
292  std::throw_with_nested(Exception(ioda_Here()));
293  }
294  }
295 
296  /// \brief Write the Variable
297  /// \note Ensure that the correct dimension ordering is preserved.
298  /// \note With default parameters, the entire Variable is written.
299  /// \tparam DataType is the type of the data to be written.
300  /// \tparam Marshaller is a class that serializes / deserializes data.
301  /// \tparam TypeWrapper translates DataType into a form that the backend understands.
302  /// \param data is a span of data.
303  /// \param mem_selection is the user's memory layout representing the location where
304  /// the data is read from.
305  /// \param file_selection is the backend's memory layout representing the
306  /// location where the data are written to.
307  /// \throws ioda::xError if data has the wrong size.
308  /// \returns The variable (for chaining).
309  template <class DataType, class Marshaller = Object_Accessor<DataType>,
310  class TypeWrapper = Types::GetType_Wrapper<DataType>>
311  Variable_Implementation write(const gsl::span<const DataType> data,
312  const Selection& mem_selection = Selection::all,
313  const Selection& file_selection = Selection::all) {
314  try {
315  Marshaller m;
316  auto d = m.serialize(data);
317  return write(gsl::make_span<char>(
318  const_cast<char*>(reinterpret_cast<const char*>(d->DataPointers.data())),
319  d->DataPointers.size() * sizeof(typename Marshaller::mutable_value_type)),
320  TypeWrapper::GetType(getTypeProvider()), mem_selection, file_selection);
321  } catch (...) {
322  std::throw_with_nested(Exception(ioda_Here()));
323  }
324  }
325 
326  /// \brief Write the variable
327  /// \tparam DataType is the type of the data to be written.
328  /// \tparam Marshaller is a class that serializes / deserializes data.
329  /// \tparam TypeWrapper translates DataType into a form that the backend understands.
330  /// \param data is a span of data.
331  /// \param mem_selection is the user's memory layout representing the location where
332  /// the data is read from.
333  /// \param file_selection is the backend's memory layout representing the
334  /// location where the data are written to.
335  /// \throws ioda::xError if data has the wrong size.
336  /// \returns The variable (for chaining).
337 
338  template <class DataType, class Marshaller = Object_Accessor<DataType>,
339  class TypeWrapper = Types::GetType_Wrapper<DataType>>
340  Variable_Implementation write(const std::vector<DataType>& data,
341  const Selection& mem_selection = Selection::all,
342  const Selection& file_selection = Selection::all) {
343  try {
344  return this->write<DataType, Marshaller, TypeWrapper>(gsl::make_span(data), mem_selection,
345  file_selection);
346  } catch (...) {
347  std::throw_with_nested(Exception(ioda_Here()));
348  }
349  }
350 
351  /// \brief Write an Eigen object (a Matrix, an Array, a Block, a Map).
352  /// \tparam EigenClass is the type of the Eigen object being written.
353  /// \param d is the data to be written.
354  /// \param mem_selection is the user's memory layout representing the location where
355  /// the data is read from.
356  /// \param file_selection is the backend's memory layout representing the
357  /// location where the data are written to.
358  /// \throws ioda::xError on a dimension mismatch.
359  /// \returns the variable
360  template <class EigenClass>
361  Variable_Implementation writeWithEigenRegular(const EigenClass& d,
362  const Selection& mem_selection = Selection::all,
363  const Selection& file_selection = Selection::all) {
364 #if 1 //__has_include("Eigen/Dense")
365  try {
366  typedef typename EigenClass::Scalar ScalarType;
367  // If d is already in Row Major form, then this is optimized out.
368  Eigen::Array<ScalarType, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor> dout;
369  dout.resize(d.rows(), d.cols());
370  dout = d;
371  const auto& dconst = dout; // To make some compilers happy.
372  auto sp = gsl::make_span(dconst.data(), static_cast<int>(d.rows() * d.cols()));
373 
374  return write<ScalarType>(sp, mem_selection, file_selection);
375  } catch (...) {
376  std::throw_with_nested(Exception(ioda_Here()));
377  }
378 #else
379  static_assert(false, "The Eigen headers cannot be found, so this function cannot be used.");
380 #endif
381  }
382 
383  /// \brief Write an Eigen Tensor-like object
384  /// \tparam EigenClass is the type of the Eigen object being written.
385  /// \param d is the data to be written.
386  /// \param mem_selection is the user's memory layout representing the location where
387  /// the data is read from.
388  /// \param file_selection is the backend's memory layout representing the
389  /// location where the data are written to.
390  /// \throws ioda::xError on a dimension mismatch.
391  /// \returns the variable
392  template <class EigenClass>
393  Variable_Implementation writeWithEigenTensor(const EigenClass& d,
394  const Selection& mem_selection = Selection::all,
395  const Selection& file_selection = Selection::all) {
396 #if 1 //__has_include("unsupported/Eigen/CXX11/Tensor")
397  try {
399 
400  auto sp = (gsl::make_span(d.data(), dims.numElements));
401  auto res = write(sp, mem_selection, file_selection);
402  return res;
403  } catch (...) {
404  std::throw_with_nested(Exception(ioda_Here()));
405  }
406 #else
407  static_assert(
408  false, "The Eigen unsupported/ headers cannot be found, so this function cannot be used.");
409 #endif
410  }
411 
412  /// @}
413  /// @name Reading Data
414  /// @{
415 
416  /// \brief Read the Variable - as char array. Ordering is row-major.
417  /// \details This is the fundamental read function that has to be implemented.
418  /// \param data is a byte-array that will hold the read data.
419  /// \param in_memory_dataType describes how ioda should arrange the read data in memory.
420  /// As floats? As doubles? Strings?
421  /// \param mem_selection is the user's memory layout representing the location where
422  /// the data is read from.
423  /// \param file_selection is the backend's memory layout representing the
424  /// location where the data are written to.
425  /// \note Ensure that the correct dimension ordering is preserved
426  /// \note With default parameters, the entire Variable is read
427  virtual Variable read(gsl::span<char> data, const Type& in_memory_dataType,
428  const Selection& mem_selection = Selection::all,
429  const Selection& file_selection = Selection::all) const;
430 
431  /// \brief Read the variable into a span (range) or memory. Ordering is row-major.
432  /// \tparam DataType is the type of the data to be written.
433  /// \tparam Marshaller is a class that serializes / deserializes data.
434  /// \tparam TypeWrapper translates DataType into a form that the backend understands.
435  /// \param data is a byte-array that will hold the read data.
436  /// \param mem_selection is the user's memory layout representing the location where
437  /// the data is read from.
438  /// \param file_selection is the backend's memory layout representing the
439  /// location where the data are written to.
440  /// \todo Add in the dataspaces!
441  template <class DataType, class Marshaller = ioda::Object_Accessor<DataType>,
442  class TypeWrapper = Types::GetType_Wrapper<DataType>>
443  Variable_Implementation read(gsl::span<DataType> data,
444  const Selection& mem_selection = Selection::all,
445  const Selection& file_selection = Selection::all) const {
446  try {
447  const size_t numObjects = data.size();
448  Dimensions_t ne = getDimensions().numElements;
449 
451  Marshaller m(pointerOwner);
452  auto p = m.prep_deserialize(numObjects);
453  read(gsl::make_span<char>(
454  reinterpret_cast<char*>(p->DataPointers.data()),
455  // Logic note: sizeof mutable data type. If we are
456  // reading in a string, then mutable data type is char*,
457  // which works because address pointers have the same size.
458  p->DataPointers.size() * sizeof(typename Marshaller::mutable_value_type)),
459  TypeWrapper::GetType(getTypeProvider()), mem_selection, file_selection);
460  m.deserialize(p, data);
461 
462  return Variable_Implementation{backend_};
463  } catch (...) {
464  std::throw_with_nested(Exception(ioda_Here()));
465  }
466  }
467 
468  /// \brief Read the variable into a vector. Resize if needed. For a non-resizing
469  /// version, use a gsl::span.
470  /// \details Ordering is row-major.
471  /// \tparam DataType is the type of the data to be written.
472  /// \tparam Marshaller is a class that serializes / deserializes data.
473  /// \tparam TypeWrapper translates DataType into a form that the backend understands.
474  /// \param data is a byte-array that will hold the read data.
475  /// \param mem_selection is the user's memory layout representing the location where
476  /// the data is read from.
477  /// \param file_selection is the backend's memory layout representing the
478  /// location where the data are written to.
479  /// \bug Resize only if needed, and resize to the proper extent depending on
480  /// mem_selection and file_selection.
481  template <class DataType, class Marshaller = ioda::Object_Accessor<DataType>,
482  class TypeWrapper = Types::GetType_Wrapper<DataType>>
483  Variable_Implementation read(std::vector<DataType>& data,
484  const Selection& mem_selection = Selection::all,
485  const Selection& file_selection = Selection::all) const {
486  data.resize(getDimensions().numElements); // TODO(Ryan): remove
487  return read<DataType, Marshaller, TypeWrapper>(gsl::make_span(data.data(), data.size()),
488  mem_selection, file_selection);
489  }
490 
491  /// \brief Read the variable into a new vector. Python convenience function.
492  /// \bug Get correct size based on selection operands.
493  /// \tparam DataType is the type of the data to be written.
494  /// \tparam Marshaller is a class that serializes / deserializes data.
495  /// \tparam TypeWrapper translates DataType into a form that the backend understands.
496  /// \param mem_selection is the user's memory layout representing the location where
497  /// the data is read from.
498  /// \param file_selection is the backend's memory layout representing the
499  /// location where the data are written to.
500  template <class DataType, class Marshaller = ioda::Object_Accessor<DataType>,
501  class TypeWrapper = Types::GetType_Wrapper<DataType>>
502  std::vector<DataType> readAsVector(const Selection& mem_selection = Selection::all,
503  const Selection& file_selection = Selection::all) const {
504  std::vector<DataType> data(getDimensions().numElements);
505  read<DataType, Marshaller, TypeWrapper>(gsl::make_span(data.data(), data.size()), mem_selection,
506  file_selection);
507  return data;
508  }
509 
510  /// \brief Valarray read convenience function. Resize if needed.
511  /// For a non-resizing version, use a gsl::span.
512  /// \tparam DataType is the type of the data to be written.
513  /// \tparam Marshaller is a class that serializes / deserializes data.
514  /// \tparam TypeWrapper translates DataType into a form that the backend understands.
515  /// \param data is a valarray acting as a data buffer that is filled with the
516  /// metadata's contents. It gets resized as needed.
517  /// \param mem_selection is the user's memory layout representing the location where
518  /// the data is read from.
519  /// \param file_selection is the backend's memory layout representing the
520  /// location where the data are written to.
521  /// \returns Another instance of this Attribute. Used for operation chaining.
522  /// \note data will be stored in row-major order.
523  template <class DataType, class Marshaller = ioda::Object_Accessor<DataType>,
524  class TypeWrapper = Types::GetType_Wrapper<DataType>>
525  Variable_Implementation read(std::valarray<DataType>& data,
526  const Selection& mem_selection = Selection::all,
527  const Selection& file_selection = Selection::all) const {
528  /// \bug Resize only if needed, and resize to the proper extent depending on
529  /// mem_selection and file_selection.
530  data.resize(getDimensions().numElements); // TODO(Ryan): remove
531  return read<DataType, Marshaller, TypeWrapper>(gsl::make_span(std::begin(data), std::end(data)),
532  mem_selection, file_selection);
533  }
534 
535  /// \brief Read data into an Eigen::Array, Eigen::Matrix, Eigen::Map, etc.
536  /// \tparam EigenClass is a template pointing to the Eigen object.
537  /// This template must provide the EigenClass::Scalar typedef.
538  /// \tparam Resize indicates whether the Eigen object should be resized
539  /// if there is a dimension mismatch. Not all Eigen objects can be resized.
540  /// \param res is the Eigen object.
541  /// \param mem_selection is the user's memory layout representing the location where
542  /// the data is read from.
543  /// \param file_selection is the backend's memory layout representing the
544  /// location where the data are written to.
545  /// \returns Another instance of this Variable. Used for operation chaining.
546  /// \throws ioda::xError if the variable's dimensionality is
547  /// too high.
548  /// \throws ioda::xError if resize = false and there is a dimension mismatch.
549  /// \note When reading in a 1-D object, the data are read as a column vector.
550  template <class EigenClass, bool Resize = detail::EigenCompat::CanResize<EigenClass>::value>
551  Variable_Implementation readWithEigenRegular(EigenClass& res,
552  const Selection& mem_selection = Selection::all,
553  const Selection& file_selection
554  = Selection::all) const {
555  /// \bug Resize only if needed, and resize to the proper extent depending on
556  /// mem_selection and file_selection.
557 #if 1 //__has_include("Eigen/Dense")
558  try {
559  typedef typename EigenClass::Scalar ScalarType;
560 
561  static_assert(
563  "This object cannot be resized, but you have specified that a resize is required.");
564 
565  // Check that the dimensionality is 1 or 2.
566  const auto dims = getDimensions();
567  if (dims.dimensionality > 2)
568  throw Exception("Dimensionality too high for a regular Eigen read. Use "
569  "Eigen::Tensor reads instead.", ioda_Here());
570 
571  int nDims[2] = {1, 1};
572  if (dims.dimsCur.size() >= 1) nDims[0] = gsl::narrow<int>(dims.dimsCur[0]);
573  if (dims.dimsCur.size() >= 2) nDims[1] = gsl::narrow<int>(dims.dimsCur[1]);
574 
575  // Resize if needed.
576  if (Resize)
578  nDims[1]); // nullop if the size is already correct.
579  else if (dims.numElements != (size_t)(res.rows() * res.cols()))
580  throw Exception("Size mismatch", ioda_Here());
581 
582  // Array copy to preserve row vs column major format.
583  // Should be optimized away by the compiler if unneeded.
584  // Note to the reader: We are reading in the data to a temporary object.
585  // We can size _this_ temporary object however we want.
586  // The temporary is used to swap row / column indices if needed.
587  // It should be optimized away if not needed... making sure this happens is a todo.
588  Eigen::Array<ScalarType, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor> data_in(res.rows(),
589  res.cols());
590 
591  auto ret = read<ScalarType>(gsl::span<ScalarType>(data_in.data(), dims.numElements),
592  mem_selection, file_selection);
593  res = data_in;
594  return ret;
595  } catch (...) {
596  std::throw_with_nested(Exception(ioda_Here()));
597  }
598 #else
599  static_assert(false, "The Eigen headers cannot be found, so this function cannot be used.");
600 #endif
601  }
602 
603  /// \brief Read data into an Eigen::Array, Eigen::Matrix, Eigen::Map, etc.
604  /// \tparam EigenClass is a template pointing to the Eigen object.
605  /// This template must provide the EigenClass::Scalar typedef.
606  /// \param res is the Eigen object.
607  /// \param mem_selection is the user's memory layout representing the location where
608  /// the data is read from.
609  /// \param file_selection is the backend's memory layout representing the
610  /// location where the data are written to.
611  /// \returns Another instance of this Variable. Used for operation chaining.
612  /// \throws jedi::xError if there is a size mismatch.
613  /// \note When reading in a 1-D object, the data are read as a column vector.
614  template <class EigenClass>
615  Variable_Implementation readWithEigenTensor(EigenClass& res,
616  const Selection& mem_selection = Selection::all,
617  const Selection& file_selection
618  = Selection::all) const {
619 #if 1 //__has_include("unsupported/Eigen/CXX11/Tensor")
620  try {
621  // Check dimensionality of source and destination
622  const auto ioda_dims = getDimensions();
623  const auto eigen_dims = ioda::detail::EigenCompat::getTensorDimensions(res);
624  if (ioda_dims.numElements != eigen_dims.numElements)
625  throw Exception("Size mismatch for Eigen Tensor-like read.", ioda_Here());
626 
627  auto sp = (gsl::make_span(res.data(), eigen_dims.numElements));
628  return read(sp, mem_selection, file_selection);
629  } catch (...) {
630  std::throw_with_nested(Exception(ioda_Here()));
631  }
632 #else
633  static_assert(
634  false, "The Eigen unsupported/ headers cannot be found, so this function cannot be used.");
635 #endif
636  }
637 
638  /// \internal Python binding function
639  template <class EigenClass>
640  EigenClass _readWithEigenRegular_python(const Selection& mem_selection = Selection::all,
641  const Selection& file_selection = Selection::all) const {
642  EigenClass data;
643  readWithEigenRegular(data, mem_selection, file_selection);
644  return data;
645  }
646 
647  /// @brief Convert a selection into its backend representation
648  /// @param sel is the frontend selection.
649  /// @return The cached backend selection.
651 
652  /// @}
653 };
654 // extern template class Variable_Base<Variable>;
655 } // namespace detail
656 
657 /** \brief Variables store data!
658  * \ingroup ioda_cxx_variable
659  *
660  * A variable represents a single field of data. It can be multi-dimensional and
661  * usually has one or more attached **dimension scales**.
662  *
663  * Variables have Metadata, which describe the variable (i.e. valid_range, long_name, units).
664  * Variables can have different data types (i.e. int16_t, float, double, string, datetime).
665  * Variables can be resized. Depending on the backend, the data in a variable can be stored
666  * using chunks, and may also be compressed.
667  *
668  * The backend manages how variables are stored in memory or on disk. The functions in the
669  * Variable class provide methods to query and set data. The goal is to have data transfers
670  * involve as few copies as possible.
671  *
672  * Variable objects themselves are lightweight handles that may be passed across different
673  * parts of a program. Variables are always stored somewhere in a Group (or ObsSpace), so you
674  * can always re-open a handle.
675  *
676  * \note Thread and MPI safety depend on the specific backends used to implement a variable.
677  * \note A variable may be linked to multiple groups and listed under multiple names, so long as
678  * the storage backends are all the same.
679  **/
680 class IODA_DL Variable : public detail::Variable_Base<Variable> {
681 public:
682  /// @name General Functions
683  /// @{
684 
685  Variable();
686  Variable(std::shared_ptr<detail::Variable_Backend> b);
687  Variable(const Variable&);
688  Variable& operator=(const Variable&);
689  virtual ~Variable();
690 
691  /// @}
692  /// @name Python compatability objects
693  /// @{
694 
696 
699 
702 
704 
705  /// @}
706 };
707 
708 namespace detail {
709 /// \brief Variable backends inherit from this.
710 class IODA_DL Variable_Backend : public Variable_Base<Variable> {
711 public:
712  virtual ~Variable_Backend();
713 
714  /// Default, trivial implementation. Customizable by backends for performance.
715  std::vector<std::vector<Named_Variable>> getDimensionScaleMappings(
716  const std::list<Named_Variable>& scalesToQueryAgainst,
717  bool firstOnly = true) const override;
718 
719  /// Default implementation. Customizable by backends for performance.
720  VariableCreationParameters getCreationParameters(bool doAtts = true,
721  bool doDims = true) const override;
722 
723 protected:
725 
726  /// @brief This function de-encapsulates an Attribute's backend storage object.
727  /// This function is used by Variable_Backend's derivatives when accessing a
728  /// Variable's Attributes. IODA-internal use only.
729  /// @tparam Attribute_Implementation is a dummy parameter used by Attributes.
730  /// @param base is the Attribute whose backend you want.
731  /// @return The encapsulated backend object.
732  template <class Attribute_Implementation = Attribute>
733  static std::shared_ptr<Attribute_Backend> _getAttributeBackend(
734  const Attribute_Implementation& att) {
735  return att.backend_;
736  }
737 
738  /// @brief This function de-encapsulates a Has_Attributes backend storage object.
739  /// IODA-internal use only.
740  /// @tparam Has_Attributes_Implementation is a dummy parameter for template resolution.
741  /// @param hatts is the Has_Attributes whose backend you want.
742  /// @return The encapsulated backend object.
743  template <class Has_Attributes_Implementation = Has_Attributes>
744  static std::shared_ptr<Has_Attributes_Backend> _getHasAttributesBackend(
745  const Has_Attributes_Implementation& hatts) {
746  return hatts.backend_;
747  }
748 };
749 } // namespace detail
750 
751 /// @brief A named pair of (variable_name, ioda::Variable).
753  std::string name;
755  bool operator<(const Named_Variable& rhs) const { return name < rhs.name; }
756 
757  Named_Variable() = default;
758  Named_Variable(const std::string& name, const ioda::Variable& var) : name(name), var(var) {}
759 };
760 
761 } // namespace ioda
762 
763 /// @}
Convenience functions to work with Eigen objects.
IODA's error system.
Fill value getters and setters.
Interfaces for ioda::Has_Attributes and related classes.
Classes and functions that implement the type system and allow for frontend/backend communication.
Dataspace selections for reading and writing ioda::Variable data.
Interfaces for ioda::Type and related classes.
Frontend/backend bindings for the type system.
Python extensions to ioda::Variable.
The ioda exception class.
Definition: Exception.h:54
This class exists inside of ioda::Group or ioda::Variable and provides the interface to manipulating ...
A Selection represents the bounds of the data, in ioda or in userspace, that you are reading or writi...
Definition: Selection.h:48
Represents the "type" (i.e. integer, string, float) of a piece of data.
Definition: Type.h:123
Variables store data!
Definition: Variable.h:680
virtual ~Variable()
detail::python_bindings::VariableReadVector< Variable > _py_readVector
Definition: Variable.h:697
detail::python_bindings::VariableScales< Variable > _py_scales
Definition: Variable.h:703
detail::python_bindings::VariableWriteNPArray< Variable > _py_writeNPArray
Definition: Variable.h:701
detail::python_bindings::VariableWriteVector< Variable > _py_writeVector
Definition: Variable.h:700
detail::python_bindings::VariableIsA< Variable > _py_isA
Definition: Variable.h:695
detail::python_bindings::VariableReadNPArray< Variable > _py_readNPArray
Definition: Variable.h:698
Backends implement type providers in conjunction with Attributes, Has_Attributes, Variables and Has_V...
Definition: Type_Provider.h:36
virtual PointerOwner getReturnedPointerOwner() const
When a pointer is passed from the backend to the frontend, who has to free it?
Variable backends inherit from this.
Definition: Variable.h:710
static std::shared_ptr< Attribute_Backend > _getAttributeBackend(const Attribute_Implementation &att)
This function de-encapsulates an Attribute's backend storage object. This function is used by Variabl...
Definition: Variable.h:733
static std::shared_ptr< Has_Attributes_Backend > _getHasAttributesBackend(const Has_Attributes_Implementation &hatts)
This function de-encapsulates a Has_Attributes backend storage object. IODA-internal use only.
Definition: Variable.h:744
Exists to prevent constructor conflicts when passing a backend into a frontend object.
Definition: Variable.h:53
virtual Variable attachDimensionScale(unsigned int DimensionNumber, const Variable &scale)
Attach a dimension scale to this Variable.
Definition: Variable.cpp:184
Variable setDimScale(const std::vector< Variable > &dims)
Set dimensions (convenience function to several invocations of attachDimensionScale).
Definition: Variable.cpp:212
bool _py_isA2(BasicTypes dataType)
Definition: Variable.h:110
Variable_Implementation readWithEigenTensor(EigenClass &res, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Read data into an Eigen::Array, Eigen::Matrix, Eigen::Map, etc.
Definition: Variable.h:615
Variable_Implementation write(const gsl::span< const DataType > data, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all)
Write the Variable.
Definition: Variable.h:311
virtual Type getType() const
Get type.
Definition: Variable.cpp:49
virtual FillValueData_t getFillValue() const
Retrieve the fill value.
Definition: Variable.cpp:111
virtual Variable setIsDimensionScale(const std::string &dimensionScaleName)
Designate this table as a dimension scale.
Definition: Variable.cpp:264
virtual std::vector< Dimensions_t > getChunkSizes() const
Retrieve the chunking options for the Variable.
Definition: Variable.cpp:123
Variable_Implementation read(std::vector< DataType > &data, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Read the variable into a vector. Resize if needed. For a non-resizing version, use a gsl::span.
Definition: Variable.h:483
Variable_Implementation writeWithEigenRegular(const EigenClass &d, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all)
Write an Eigen object (a Matrix, an Array, a Block, a Map).
Definition: Variable.h:361
Variable_Implementation writeWithEigenTensor(const EigenClass &d, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all)
Write an Eigen Tensor-like object.
Definition: Variable.h:393
virtual std::pair< bool, int > getGZIPCompression() const
Retrieve the GZIP compression options for the Variable.
Definition: Variable.cpp:136
std::shared_ptr< Variable_Backend > backend_
Using an opaque object to implement the backend.
Definition: Variable.h:56
bool isA() const
Convenience function to check a Variable's storage type.
Definition: Variable.h:99
Has_Attributes atts
Attributes.
Definition: Variable.h:71
virtual bool isDimensionScaleAttached(unsigned int DimensionNumber, const Variable &scale) const
Is a dimension scale attached to this Variable in a certain position?
Definition: Variable.cpp:288
Variable_Implementation read(std::valarray< DataType > &data, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Valarray read convenience function. Resize if needed. For a non-resizing version, use a gsl::span.
Definition: Variable.h:525
virtual bool hasFillValue() const
Check if a variable has a fill value set.
Definition: Variable.cpp:98
Variable_Implementation write(const std::vector< DataType > &data, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all)
Write the variable.
Definition: Variable.h:340
virtual bool isDimensionScale() const
Is this Variable used as a dimension scale?
Definition: Variable.cpp:251
virtual Variable detachDimensionScale(unsigned int DimensionNumber, const Variable &scale)
Detach a dimension scale.
Definition: Variable.cpp:198
BasicTypes getBasicType() const
Convenience function to query type.
Type type() const
Get type.
Definition: Variable.h:88
Variable_Implementation read(gsl::span< DataType > data, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Read the variable into a span (range) or memory. Ordering is row-major.
Definition: Variable.h:443
virtual Dimensions getDimensions() const
Definition: Variable.cpp:160
virtual std::tuple< bool, unsigned, unsigned > getSZIPCompression() const
Retrieve the SZIP compression options for the Variable.
Definition: Variable.cpp:148
std::vector< DataType > readAsVector(const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Read the variable into a new vector. Python convenience function.
Definition: Variable.h:502
virtual std::vector< std::vector< Named_Variable > > getDimensionScaleMappings(const std::list< Named_Variable > &scalesToQueryAgainst, bool firstOnly=true) const
Which dimensions are attached at which positions? This function may offer improved performance on som...
Definition: Variable.cpp:303
Variable_Implementation write(const gsl::span< DataType > data, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all)
Write the Variable.
Definition: Variable.h:281
virtual VariableCreationParameters getCreationParameters(bool doAtts=true, bool doDims=true) const
Convenience function to get fill value, attributes, chunk sizes, and compression in a collective call...
Definition: Variable.cpp:85
virtual detail::Type_Provider * getTypeProvider() const
Query the backend and get the type provider.
Definition: Variable.cpp:37
std::string getDimensionScaleName() const
Get the name of this Variable's defined dimension scale.
Definition: Variable.h:217
virtual Variable read(gsl::span< char > data, const Type &in_memory_dataType, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Read the Variable - as char array. Ordering is row-major.
Definition: Variable.cpp:330
Variable_Base(std::shared_ptr< Variable_Backend >)
Definition: Variable.cpp:15
bool isA(BasicTypes dataType) const
Python compatability function.
Definition: Variable.h:108
EigenClass _readWithEigenRegular_python(const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Definition: Variable.h:640
virtual Variable write(gsl::span< char > data, const Type &in_memory_dataType, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all)
The fundamental write function. Backends overload this function to implement all write operations.
Definition: Variable.cpp:317
std::shared_ptr< Variable_Backend > get() const
Gets a handle to the underlying object that implements the backend functionality.
Definition: Variable.cpp:21
virtual Variable resize(const std::vector< Dimensions_t > &newDims)
Resize the variable.
Definition: Variable.cpp:172
detail::FillValueData_t FillValueData_t
Remap fill value storage type into this class.
Definition: Variable.h:135
virtual Selections::SelectionBackend_t instantiateSelection(const Selection &sel) const
Convert a selection into its backend representation.
Definition: Variable.cpp:344
Variable_Implementation readWithEigenRegular(EigenClass &res, const Selection &mem_selection=Selection::all, const Selection &file_selection=Selection::all) const
Read data into an Eigen::Array, Eigen::Matrix, Eigen::Map, etc.
Definition: Variable.h:551
Common preprocessor definitions used throughout IODA.
#define IODA_DL
A preprocessor tag that indicates that a symbol is to be exported/imported.
Definition: defs.h:110
Type GetType(gsl::not_null< const ::ioda::detail::Type_Provider * > t, std::initializer_list< Dimensions_t > Adims={}, typename std::enable_if<!is_string< DataType >::value >::type *=0)
For fundamental, non-string types.
Definition: Type.h:189
std::shared_ptr< InstantiatedSelection > SelectionBackend_t
Definition: Selection.h:35
static IODA_DL const Selection all
Definition: Selection.h:131
PointerOwner
Who owns (and should free) pointers passed across the frontend / backend interface?
Definition: Type_Provider.h:27
list newDims
Definition: 05-ObsGroup.py:95
::std::is_base_of< ResizeableBase, EigenClass > CanResize
Definition: Eigen_Compat.h:54
Dimensions getTensorDimensions(EigenClass &e)
Definition: Eigen_Compat.h:72
typename ::std::enable_if< CanResize< EigenClass >::value >::type DoEigenResize(EigenClass &e, ::Eigen::Index rows, ::Eigen::Index cols)
Definition: Eigen_Compat.h:57
BasicTypes
Definition: Type.h:37
#define ioda_Here()
Describes the dimensions of an Attribute or Variable.
Definition: Dimensions.h:22
Dimensions_t numElements
Definition: Dimensions.h:26
A named pair of (variable_name, ioda::Variable).
Definition: Variable.h:752
Named_Variable()=default
Named_Variable(const std::string &name, const ioda::Variable &var)
Definition: Variable.h:758
bool operator<(const Named_Variable &rhs) const
Definition: Variable.h:755
ioda::Variable var
Definition: Variable.h:754
std::string name
Definition: Variable.h:753
static Type GetType(gsl::not_null< const ::ioda::detail::Type_Provider * > t)
Definition: Type.h:280
Used to specify Variable creation-time properties.
Definition: Has_Variables.h:57
Container used to store and manipulate fill values.
Definition: Fill.h:35