IODA
ioda.py
Go to the documentation of this file.
1 import ioda._ioda_python as _iodapy
2 import datetime as dt
3 import numpy as np
4 import os
5 
6 class ObsSpace:
7 
8  def __repr__(self):
9  return f"ObsSpace({self.name},{self.iodafile})"
10 
11  def __str__(self):
12  return f"IODA ObsSpace Object - {self.name}"
13 
14  def __init__(self, path, dim_dict=None, mode='r', name="NoName", iodalayout=0):
15  self.namename = name
16  if mode not in ['r', 'w' ,'rw']:
17  raise TypeError(f"{mode} not one of 'r','w','rw'")
18  self.writewrite = True if 'w' in mode else False
19  self.readread = True if 'r' in mode else False
20  if os.path.isfile(path) and self.readread:
21  self.iodafileiodafile = path
22  elif os.path.exists(os.path.dirname(path)) and self.writewrite:
23  self.iodafileiodafile = path
24  else:
25  raise OSError(f"{path} does not specify a valid path to a file")
26  self.iodalayoutiodalayout = iodalayout
27  # read obsgroup from IODA
28  if self.readread:
29  self.file, self.obsgroupobsgroup = self._read_obsgroup_read_obsgroup(self.iodafileiodafile)
30  self._def_classvars_def_classvars()
31  else:
32  if dim_dict is not None:
33  self.file, self.obsgroupobsgroup = self._create_obsgroup_create_obsgroup(self.iodafileiodafile, dim_dict)
34  else:
35  raise TypeError("dim_dict is not defined")
36 
37  def _def_classvars(self):
38  # define some variables
39  self.dimensionsdimensions = self.obsgroupobsgroup.vars.list()
40  self.groupsgroups = self.file.listGroups(recurse=True)
41  self.attrsattrs = self.obsgroupobsgroup.atts.list()
42  self.nlocsnlocs = len(self.obsgroupobsgroup.vars.open('nlocs').readVector.int())
43  self.variablesvariables = self.file.listVars(recurse=True)
44  self.nvarsnvars = len(self.variablesvariables)
45 
46  def write_attr(self, attrName, attrVal):
47  # get type of variable
48  try:
49  attrType = self.NumpyToIodaDtypeNumpyToIodaDtype(attrVal)
50  if attrType == _iodapy.Types.float:
51  if np.array(attrVal).size == 1:
52  self.obsgroupobsgroup.atts.create(attrName, attrType,
53  [1]).writeDatum.float(attrVal)
54  else:
55  self.obsgroupobsgroup.atts.create(attrName, attrType,
56  len(attrVal)).writeVector.float(attrVal)
57  elif attrType == _iodapy.Types.double:
58  if np.array(attrVal).size == 1:
59  self.obsgroupobsgroup.atts.create(attrName, attrType,
60  [1]).writeDatum.double(attrVal)
61  else:
62  self.obsgroupobsgroup.atts.create(attrName, attrType,
63  len(attrVal)).writeVector.double(attrVal)
64  elif attrType == _iodapy.Types.int64:
65  if np.array(attrVal).size == 1:
66  self.obsgroupobsgroup.atts.create(attrName, attrType,
67  [1]).writeDatum.int64(attrVal)
68  else:
69  self.obsgroupobsgroup.atts.create(attrName, attrType,
70  len(attrVal)).writeVector.int64(attrVal)
71  elif attrType == _iodapy.Types.int32:
72  if np.array(attrVal).size == 1:
73  self.obsgroupobsgroup.atts.create(attrName, attrType,
74  [1]).writeDatum.int32(attrVal)
75  else:
76  self.obsgroupobsgroup.atts.create(attrName, attrType,
77  len(attrVal)).writeVector.int32(attrVal)
78  # add other elif here TODO
79  except AttributeError: # if string
80  if (type(attrVal) == str):
81  attrType = _iodapy.Types.str
82  self.obsgroupobsgroup.atts.create(
83  attrName, attrType, [1]).writeDatum.str(attrVal)
84 
85  def _read_obsgroup(self, path):
86  # open the obs group for a specified file and return file and obsgroup objects
87  if self.writewrite:
88  iodamode = _iodapy.Engines.BackendOpenModes.Read_Write
89  else:
90  iodamode = _iodapy.Engines.BackendOpenModes.Read_Only
91  g = _iodapy.Engines.HH.openFile(
92  name=path,
93  mode=iodamode,
94  )
95  dlp = _iodapy.DLP.DataLayoutPolicy.generate(
96  _iodapy.DLP.DataLayoutPolicy.Policies(self.iodalayoutiodalayout))
97  og = _iodapy.ObsGroup(g, dlp)
98  return g, og
99 
100  def _create_obsgroup(self, path, dim_dict):
101  # open a new file for writing and return file and obsgroup objects
102  g = _iodapy.Engines.HH.createFile(
103  name=path,
104  mode=_iodapy.Engines.BackendCreateModes.Truncate_If_Exists,
105  )
106  # create list of dims in obs group
107  _dim_list = []
108  for key, value in dim_dict.items():
109  if key == 'nlocs':
110  _nlocs_var = _iodapy.NewDimensionScale.int32(
111  'nlocs', value, _iodapy.Unlimited, value)
112  _dim_list.append(_nlocs_var)
113  else:
114  _dim_list.append(_iodapy.NewDimensionScale.int32(
115  key, value, value, value))
116  # create obs group
117  og = _iodapy.ObsGroup.generate(g, _dim_list)
118  # default compression option
119  self._p1_p1 = _iodapy.VariableCreationParameters()
120  self._p1_p1.compressWithGZIP()
121  return g, og
122 
123  def create_var(self, varname, groupname=None, dtype=np.dtype('float32'), dim_list=['nlocs']):
124  dtype_tmp = np.array([],dtype=dtype)
125  typeVar = self.NumpyToIodaDtypeNumpyToIodaDtype(dtype_tmp)
126  _varstr = varname
127  if groupname is not None:
128  _varstr = f"{groupname}/{varname}"
129  # get list of dimension variables
130  dims = [self.obsgroupobsgroup.vars.open(dim) for dim in dim_list]
131  newVar = self.file.vars.create(_varstr, typeVar,
132  scales=dims, params=self._p1_p1)
133 
134  def Variable(self, varname, groupname=None):
135  return self._Variable_Variable(self, varname, groupname)
136 
137  def NumpyToIodaDtype(self, NumpyArr):
138  ############################################################
139  # This method converts the numpy data type to the
140  # corresponding ioda datatype
141 
142  NumpyDtype = NumpyArr.dtype
143 
144  if (NumpyDtype == np.dtype('float64')):
145  IodaDtype = _iodapy.Types.double # convert double to float
146  elif (NumpyDtype == np.dtype('float32')):
147  IodaDtype = _iodapy.Types.float
148  elif (NumpyDtype == np.dtype('int64')):
149  IodaDtype = _iodapy.Types.int64 # convert long to int
150  elif (NumpyDtype == np.dtype('int32')):
151  IodaDtype = _iodapy.Types.int32
152  elif (NumpyDtype == np.dtype('int16')):
153  IodaDtype = _iodapy.Types.int16
154  elif (NumpyDtype == np.dtype('int8')):
155  IodaDtype = _iodapy.Types.int16
156  elif (NumpyDtype == np.dtype('S1')):
157  IodaDtype = _iodapy.Types.str
158  elif (NumpyDtype == np.dtype('object')):
159  IodaDtype = _iodapy.Types.str
160  else:
161  try:
162  a = str(NumpyArr[0])
163  IodaDtype = _iodapy.Types.str
164  except TypeError:
165  print("ERROR: Unrecognized numpy data type: ", NumpyDtype)
166  exit(-2)
167  return IodaDtype
168 
169  class _Variable:
170  def __repr__(self):
171  return f"IODA variable ({self._varstr})"
172 
173  def __str__(self):
174  return f"IODA variable object - {self._varstr}"
175 
176  def __init__(self, obsspace, varname, groupname=None):
177  self.obsspaceobsspace = obsspace
178  self._varstr_varstr = varname
179  if groupname is not None:
180  self._varstr_varstr = f"{groupname}/{varname}"
181  self._iodavar_iodavar = self.obsspaceobsspace.obsgroup.vars.open(self._varstr_varstr)
182  self.attrsattrs = self._iodavar_iodavar.atts.list()
183 
184  def write_data(self, npArray):
185  datatype = self.obsspaceobsspace.NumpyToIodaDtype(npArray)
186  if datatype == _iodapy.Types.float:
187  self._iodavar_iodavar.writeNPArray.float(npArray)
188  elif datatype == _iodapy.Types.double:
189  self._iodavar_iodavar.writeNPArray.double(npArray)
190  elif datatype == _iodapy.Types.int64:
191  self._iodavar_iodavar.writeNPArray.int64(npArray)
192  elif datatype == _iodapy.Types.int32:
193  self._iodavar_iodavar.writeNPArray.int32(npArray)
194  elif datatype == _iodapy.Types.str:
195  self._iodavar_iodavar.writeVector.str(npArray)
196  # add other elif here TODO
197 
198  def write_attr(self, attrName, attrVal):
199  # get type of variable
200  try:
201  attrType = self.obsspaceobsspace.NumpyToIodaDtype(attrVal)
202  if attrType == _iodapy.Types.float:
203  if len(attrVal) == 1:
204  self._iodavar_iodavar.atts.create(attrName, attrType,
205  [1]).writeDatum.float(attrVal)
206  else:
207  self._iodavar_iodavar.atts.create(attrName, attrType,
208  len(attrVal)).writeVector.float(attrVal)
209  elif attrType == _iodapy.Types.double:
210  if len(attrVal) == 1:
211  self._iodavar_iodavar.atts.create(attrName, attrType,
212  [1]).writeDatum.double(attrVal)
213  else:
214  self._iodavar_iodavar.atts.create(attrName, attrType,
215  len(attrVal)).writeVector.double(attrVal)
216  elif attrType == _iodapy.Types.int64:
217  if len(attrVal) == 1:
218  self._iodavar_iodavar.atts.create(attrName, attrType,
219  [1]).writeDatum.int64(attrVal)
220  else:
221  self._iodavar_iodavar.atts.create(attrName, attrType,
222  len(attrVal)).writeVector.int64(attrVal)
223  elif attrType == _iodapy.Types.int32:
224  if len(attrVal) == 1:
225  self._iodavar_iodavar.atts.create(attrName, attrType,
226  [1]).writeDatum.int32(attrVal)
227  else:
228  self._iodavar_iodavar.atts.create(attrName, attrType,
229  len(attrVal)).writeVector.int32(attrVal)
230  # add other elif here TODO
231  except AttributeError: # if string
232  if (type(attrVal) == str):
233  attrType = _iodapy.Types.str
234  self._iodavar_iodavar.atts.create(
235  attrName, attrType, [1]).writeDatum.str(attrVal)
236 
237  def read_data(self):
238  """
239  returns numpy array/python list of variable data
240  """
241  # figure out what datatype the variable is
242  if self._iodavar_iodavar.isA2(_iodapy.Types.float):
243  # float
244  data = self._iodavar_iodavar.readNPArray.float()
245  data[np.abs(data) > 9e36] = np.nan # undefined values
246  elif self._iodavar_iodavar.isA2(_iodapy.Types.int):
247  # integer
248  data = self._iodavar_iodavar.readNPArray.int()
249  elif self._iodavar_iodavar.isA2(_iodapy.Types.str):
250  # string
251  data = self._iodavar_iodavar.readVector.str() # ioda cannot read str to datetime...
252  # convert to datetimes if applicable
253  if "datetime" in self._varstr_varstr:
254  data = self._str_to_datetime_str_to_datetime(data)
255  else:
256  raise TypeError(f"Variable {self._varstr} type not supported")
257  # reshape if it is a 2D array with second dim size 1
258  try:
259  if data.shape[1] == 1:
260  data = data.flatten()
261  except (IndexError, AttributeError):
262  pass
263  return data
264 
265  def _str_to_datetime(self, datain):
266  # comes as a list of strings, need to
267  # make into datetime objects
268  datetimes = [dt.datetime.strptime(x, "%Y-%m-%dT%H:%M:%SZ") for x in datain]
269  return np.array(datetimes)
def _str_to_datetime(self, datain)
Definition: ioda.py:265
def __init__(self, obsspace, varname, groupname=None)
Definition: ioda.py:176
def write_attr(self, attrName, attrVal)
Definition: ioda.py:198
def write_data(self, npArray)
Definition: ioda.py:184
def __repr__(self)
Definition: ioda.py:8
def NumpyToIodaDtype(self, NumpyArr)
Definition: ioda.py:137
def _read_obsgroup(self, path)
Definition: ioda.py:85
def _create_obsgroup(self, path, dim_dict)
Definition: ioda.py:100
def Variable(self, varname, groupname=None)
Definition: ioda.py:134
def create_var(self, varname, groupname=None, dtype=np.dtype('float32'), dim_list=['nlocs'])
Definition: ioda.py:123
def _def_classvars(self)
Definition: ioda.py:37
def __str__(self)
Definition: ioda.py:11
def write_attr(self, attrName, attrVal)
Definition: ioda.py:46
def __init__(self, path, dim_dict=None, mode='r', name="NoName", iodalayout=0)
Definition: ioda.py:14