Loading [MathJax]/extensions/tex2jax.js
IODA
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
src/distribution/Distribution.h
Go to the documentation of this file.
1 /*
2  * (C) Copyright 2017 UCAR
3  *
4  * This software is licensed under the terms of the Apache Licence Version 2.0
5  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
6  */
7 
8 #ifndef DISTRIBUTION_DISTRIBUTION_H_
9 #define DISTRIBUTION_DISTRIBUTION_H_
10 
11 #include <memory>
12 #include <vector>
13 
14 #include "eckit/config/Configuration.h"
15 #include "eckit/exception/Exceptions.h"
16 #include "eckit/geometry/Point2.h"
17 #include "eckit/mpi/Comm.h"
18 #include "oops/util/missingValues.h"
19 #include "oops/util/TypeTraits.h"
20 
21 namespace util {
22 class DateTime;
23 }
24 
25 namespace ioda {
26 
27 template <typename T>
28 class Accumulator;
29 
30 // ---------------------------------------------------------------------
31 /*!
32  * \brief class for distributing obs across multiple process elements
33  *
34  * \details This Distribution class is a base class where various subclasses of
35  * this class define different methods for distributing obs.
36  *
37  * The subclasses of this base class need to implement all pure virtual functions.
38  * The client will use the isMyRecord method to determine what records to keep
39  * when reading in observations.
40  *
41  * assignRecord() must be called before isMyRecord() can be called.
42  * computePatchLocs() should be called when all records have been assigned.
43  *
44  * for distributions with observations duplicated on multiple PEs
45  * (currently Inefficient and Halo) the following terminology/logic is used:
46  * the set of obs on each PE is called halo obs. (as in within a halo of some location)
47  * obs in the halo set can be duplicated across multiple PEs
48  * the subset of halo obs. (patch obs.) "belong" only to this PE and are used to
49  * compute reduce operations without duplication.
50  * patch obs form complete, non-overlapping partition of the global set of obs.
51  *
52  * \author Xin Zhang (JCSDA)
53  *
54  * \see Functions defined in DistributionUtils.h.
55  */
56 class Distribution {
57  public:
58  explicit Distribution(const eckit::mpi::Comm & Comm);
59  virtual ~Distribution();
60 
61  /*!
62  * \brief Returns true if the distribution assigns all records to all PEs, false otherwise.
63  */
64  virtual bool isIdentity() const { return false; }
65 
66  /*!
67  * \brief Returns true if the distribution does not assign any record to more than one PE,
68  * false otherwise.
69  */
70  virtual bool isNonoverlapping() const { return false; }
71 
72  /*!
73  * \brief If the record \p RecNum has not yet been assigned to a PE, assigns it to the
74  * appropriate PE. Informs the distribution that location \p LocNum belongs to this record.
75  *
76  * \param RecNum Record containing the location \p LocNum.
77  * \param LocNum (Global) location index.
78  * \param point Latitude and longitude of this location.
79  */
80  virtual void assignRecord(const std::size_t RecNum, const std::size_t LocNum,
81  const eckit::geometry::Point2 & point) {}
82 
83  /*!
84  * \brief Returns true if record \p RecNum has been assigned to the calling PE during a
85  * previous call to assignRecord().
86  *
87  * Clients can use this function to determine which records to keep when reading in
88  * observations.
89  */
90  virtual bool isMyRecord(std::size_t RecNum) const = 0;
91 
92  /*!
93  * \brief If necessary, identifies locations of "patch obs", i.e. locations belonging to
94  * records owned by this PE.
95  *
96  * This function must be called when all records have been assigned, and in particular
97  * before any calls to the createAccumulator() and globalUniqueConsecutiveLocationIndex()
98  * member functions or the global functions and dotProduct(), globalNumNonMissingObs().
99  */
100  virtual void computePatchLocs() {}
101 
102  /*!
103  * \brief Sets each element of the provided vector to true if the corresponding location is a
104  * "patch obs", i.e. it belongs to a record owned by this PE, and to false otherwise.
105  *
106  * \param isPatchObs Preallocated vector of as many elements as there are locations on this PE.
107  */
108  virtual void patchObs(std::vector<bool> & isPatchObs) const = 0;
109 
110  /*!
111  * \brief Calculates the global minimum (over all locations on all PEs) of a
112  * location-dependent quantity.
113  *
114  * \param[inout] x
115  * On input, the local minimum (over all locations on the current PE) of a location-dependent
116  * quantity. On output, its global minimum.
117  */
118  virtual void min(int & x) const = 0;
119  virtual void min(std::size_t & x) const = 0;
120  virtual void min(float & x) const = 0;
121  virtual void min(double & x) const = 0;
122 
123  /*!
124  * \brief Calculates the global minima (over all locations on all PEs) of multiple
125  * location-dependent quantities.
126  *
127  * \param[inout] x
128  * On input, each element of `x` should be the local minimum (over all locations on the
129  * current PE) of a location-dependent quantity. On output, that element will be set to the
130  * global minimum of that quantity.
131  */
132  virtual void min(std::vector<int> & x) const = 0;
133  virtual void min(std::vector<std::size_t> & x) const = 0;
134  virtual void min(std::vector<float> & x) const = 0;
135  virtual void min(std::vector<double> & x) const = 0;
136 
137  /*!
138  * \brief Calculates the global maximum (over all locations on all PEs) of a
139  * location-dependent quantity.
140  *
141  * \param[inout] x
142  * On input, the local maximum (over all locations on the current PE) of a location-dependent
143  * quantity. On output, its global maximum.
144  */
145  virtual void max(int & x) const = 0;
146  virtual void max(std::size_t & x) const = 0;
147  virtual void max(float & x) const = 0;
148  virtual void max(double & x) const = 0;
149 
150  /*!
151  * \brief Calculates the global maxima (over all locations on all PEs) of multiple
152  * location-dependent quantities.
153  *
154  * \param[inout] x
155  * On input, each element of `x` should be the local maximum (over all locations on the
156  * current PE) of a location-dependent quantity. On output, that element will be set to the
157  * global maximum of that quantity.
158  */
159  virtual void max(std::vector<int> & x) const = 0;
160  virtual void max(std::vector<std::size_t> & x) const = 0;
161  virtual void max(std::vector<float> & x) const = 0;
162  virtual void max(std::vector<double> & x) const = 0;
163 
164  /*!
165  * \brief Create an object that can be used to calculate the sum of a location-dependent
166  * quantity over locations held on all PEs, each taken into account only once even if it's
167  * held on multiple PEs.
168  *
169  * \tparam T
170  * Must be either `int`, `size_t`, `float` or `double`.
171  * \param init
172  * Used only to select the right overload -- the value is ignored.
173  */
174  template <typename T>
175  std::unique_ptr<Accumulator<T>> createAccumulator() const {
176  static_assert(util::any_is_same<T, int, std::size_t, float, double>::value,
177  "in the call to createAccumulator<T>(), "
178  "T must be int, size_t, float or double");
179  return createAccumulatorImpl(T());
180  }
181 
182  /*!
183  * \brief Create an object that can be used to calculate the sums of `n`
184  * location-dependent quantities over locations held on all PEs, each taken into account only
185  * once even if it's held on multiple PEs.
186  *
187  * \tparam T
188  * Must be either `int`, `size_t`, `float` or `double`.
189  * \param n
190  * The number of quantities to be summed up.
191  */
192  template <typename T>
193  std::unique_ptr<Accumulator<std::vector<T>>> createAccumulator(std::size_t n) const {
194  static_assert(util::any_is_same<T, int, std::size_t, float, double>::value,
195  "in the call to createAccumulator<T>(size_t n), "
196  "T must be int, size_t, float or double");
197  return createAccumulatorImpl(std::vector<T>(n));
198  }
199 
200  /*!
201  * \brief Gather observation data from all processes and deliver the combined data to
202  * all processes.
203  *
204  * \param[inout] x
205  * On input: a vector whose ith element is associated with the ith observation held by the
206  * calling process.
207  * On output: a concatenation of the vectors `x` passed by all calling processes, with
208  * duplicates removed (i.e. if any observations are duplicated across multiple processes, the
209  * elements of `x` corresponding to these data are included only once).
210  */
211  virtual void allGatherv(std::vector<size_t> &x) const = 0;
212  virtual void allGatherv(std::vector<int> &x) const = 0;
213  virtual void allGatherv(std::vector<float> &x) const = 0;
214  virtual void allGatherv(std::vector<double> &x) const = 0;
215  virtual void allGatherv(std::vector<util::DateTime> &x) const = 0;
216  virtual void allGatherv(std::vector<std::string> &x) const = 0;
217 
218  /*!
219  * \brief Map the index of a location held on the calling process to the index of the
220  * corresponding element of any vector produced by allGatherv().
221  */
222  virtual size_t globalUniqueConsecutiveLocationIndex(size_t loc) const = 0;
223 
224  // return the name of the distribution
225  virtual std::string name() const = 0;
226 
227  /// Accessor to MPI rank
228  size_t rank() const {return comm_.rank();}
229 
230  private:
231  /*!
232  * \brief Create an object that can be used to calculate the sum of a location-dependent
233  * quantity over locations held on all PEs, each taken into account only once even if it's
234  * held on multiple PEs.
235  *
236  * \param init
237  * Used only to select the right overload -- the value is ignored.
238  */
239  virtual std::unique_ptr<Accumulator<int>>
240  createAccumulatorImpl(int init) const = 0;
241  virtual std::unique_ptr<Accumulator<std::size_t>>
242  createAccumulatorImpl(std::size_t init) const = 0;
243  virtual std::unique_ptr<Accumulator<float>>
244  createAccumulatorImpl(float init) const = 0;
245  virtual std::unique_ptr<Accumulator<double>>
246  createAccumulatorImpl(double init) const = 0;
247 
248  /*!
249  * \brief Create an object that can be used to calculate the sums of multiple
250  * location-dependent quantities over locations held on all PEs, each taken into account only
251  * once even if it's held on multiple PEs.
252  *
253  * \param init
254  * A vector of as many elements as there are sums to calculate. The values of these elements
255  * are ignored.
256  */
257  virtual std::unique_ptr<Accumulator<std::vector<int>>>
258  createAccumulatorImpl(const std::vector<int> & init) const = 0;
259  virtual std::unique_ptr<Accumulator<std::vector<std::size_t>>>
260  createAccumulatorImpl(const std::vector<std::size_t> & init) const = 0;
261  virtual std::unique_ptr<Accumulator<std::vector<float>>>
262  createAccumulatorImpl(const std::vector<float> & init) const = 0;
263  virtual std::unique_ptr<Accumulator<std::vector<double>>>
264  createAccumulatorImpl(const std::vector<double> & init) const = 0;
265 
266  protected:
267  /*! \brief Local MPI communicator */
268  const eckit::mpi::Comm & comm_;
269 };
270 
271 } // namespace ioda
272 
273 #endif // DISTRIBUTION_DISTRIBUTION_H_
class for distributing obs across multiple process elements
virtual void min(std::vector< std::size_t > &x) const =0
virtual bool isIdentity() const
Returns true if the distribution assigns all records to all PEs, false otherwise.
virtual void max(int &x) const =0
Calculates the global maximum (over all locations on all PEs) of a location-dependent quantity.
std::unique_ptr< Accumulator< std::vector< T > > > createAccumulator(std::size_t n) const
Create an object that can be used to calculate the sums of n location-dependent quantities over locat...
virtual void allGatherv(std::vector< size_t > &x) const =0
Gather observation data from all processes and deliver the combined data to all processes.
virtual void max(std::size_t &x) const =0
virtual bool isNonoverlapping() const
Returns true if the distribution does not assign any record to more than one PE, false otherwise.
const eckit::mpi::Comm & comm_
Local MPI communicator.
virtual void allGatherv(std::vector< util::DateTime > &x) const =0
virtual void min(std::vector< double > &x) const =0
virtual std::unique_ptr< Accumulator< int > > createAccumulatorImpl(int init) const =0
Create an object that can be used to calculate the sum of a location-dependent quantity over location...
virtual void allGatherv(std::vector< int > &x) const =0
virtual std::unique_ptr< Accumulator< std::vector< float > > > createAccumulatorImpl(const std::vector< float > &init) const =0
virtual std::unique_ptr< Accumulator< std::vector< double > > > createAccumulatorImpl(const std::vector< double > &init) const =0
virtual void max(double &x) const =0
virtual std::string name() const =0
virtual void patchObs(std::vector< bool > &isPatchObs) const =0
Sets each element of the provided vector to true if the corresponding location is a "patch obs",...
virtual std::unique_ptr< Accumulator< std::size_t > > createAccumulatorImpl(std::size_t init) const =0
virtual void max(std::vector< int > &x) const =0
Calculates the global maxima (over all locations on all PEs) of multiple location-dependent quantitie...
virtual bool isMyRecord(std::size_t RecNum) const =0
Returns true if record RecNum has been assigned to the calling PE during a previous call to assignRec...
size_t rank() const
Accessor to MPI rank.
virtual void allGatherv(std::vector< std::string > &x) const =0
Distribution(const eckit::mpi::Comm &Comm)
Definition: Distribution.cc:19
virtual void min(int &x) const =0
Calculates the global minimum (over all locations on all PEs) of a location-dependent quantity.
virtual void allGatherv(std::vector< double > &x) const =0
virtual void allGatherv(std::vector< float > &x) const =0
virtual ~Distribution()
Definition: Distribution.cc:25
virtual void min(std::vector< float > &x) const =0
virtual void min(std::vector< int > &x) const =0
Calculates the global minima (over all locations on all PEs) of multiple location-dependent quantitie...
virtual void min(std::size_t &x) const =0
virtual void max(float &x) const =0
virtual void min(float &x) const =0
virtual void max(std::vector< std::size_t > &x) const =0
virtual void max(std::vector< double > &x) const =0
virtual void max(std::vector< float > &x) const =0
virtual size_t globalUniqueConsecutiveLocationIndex(size_t loc) const =0
Map the index of a location held on the calling process to the index of the corresponding element of ...
virtual std::unique_ptr< Accumulator< std::vector< std::size_t > > > createAccumulatorImpl(const std::vector< std::size_t > &init) const =0
virtual std::unique_ptr< Accumulator< std::vector< int > > > createAccumulatorImpl(const std::vector< int > &init) const =0
Create an object that can be used to calculate the sums of multiple location-dependent quantities ove...
virtual void assignRecord(const std::size_t RecNum, const std::size_t LocNum, const eckit::geometry::Point2 &point)
If the record RecNum has not yet been assigned to a PE, assigns it to the appropriate PE.
std::unique_ptr< Accumulator< T > > createAccumulator() const
Create an object that can be used to calculate the sum of a location-dependent quantity over location...
virtual void computePatchLocs()
If necessary, identifies locations of "patch obs", i.e.
virtual std::unique_ptr< Accumulator< float > > createAccumulatorImpl(float init) const =0
virtual std::unique_ptr< Accumulator< double > > createAccumulatorImpl(double init) const =0
virtual void min(double &x) const =0