IODA
DistributionUtils.h
Go to the documentation of this file.
1 /*
2  * (C) Crown copyright 2021, Met Office
3  *
4  * This software is licensed under the terms of the Apache Licence Version 2.0
5  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
6  */
7 
8 #ifndef DISTRIBUTION_DISTRIBUTIONUTILS_H_
9 #define DISTRIBUTION_DISTRIBUTIONUTILS_H_
10 
11 #include <memory>
12 #include <string>
13 #include <vector>
14 
15 namespace eckit {
16 namespace mpi {
17 class Comm;
18 }
19 }
20 
21 namespace util {
22 class DateTime;
23 }
24 
25 namespace ioda {
26 
27 class Distribution;
28 
29 /// \brief Computes the dot product between two vectors of obs distributed across MPI ranks.
30 ///
31 /// \param distribution
32 /// Distribution used to partition observations across MPI ranks.
33 /// \param numVariables
34 /// Number of variables whose observations are stored in `v1` and `v2`.
35 /// \param v1, v2
36 /// Vectors of observations. Observations of individual variables should be interleaved,
37 /// i.e. the observation of variable `ivar` at location `iloc` in the halo of the calling MPI
38 /// rank should be stored in element `(iloc * numVariables + ivar)` of each vector.
39 ///
40 /// \return The dot product of the two vectors, with observations taken at locations belonging to
41 /// the halos of multiple MPI ranks counted only once and any missing values treated as if they
42 /// were zeros.
43 ///
44 /// \relates Distribution
45 double dotProduct(const Distribution &dist, std::size_t numVariables,
46  const std::vector<double> &v1, const std::vector<double> &v2);
47 double dotProduct(const Distribution &dist, std::size_t numVariables,
48  const std::vector<float> &v1, const std::vector<float> &v2);
49 double dotProduct(const Distribution &dist, std::size_t numVariables,
50  const std::vector<int> &v1, const std::vector<int> &v2);
51 
52 /// \brief Counts unique non-missing observations in a vector.
53 ///
54 /// \param distribution
55 /// Distribution used to partition observations across MPI ranks.
56 /// \param numVariables
57 /// Number of variables whose observations are stored in `v`.
58 /// \param v
59 /// Vector of observations. Observations of individual variables should be interleaved,
60 /// i.e. the observation of variable `ivar` at location `iloc` in the halo of the calling MPI
61 /// rank should be stored at `v[iloc * numVariables + ivar]`.
62 ///
63 /// \return The number of unique observations on all MPI ranks set to something else than the
64 /// missing value indicator. "Unique" means that observations taken at locations belonging to the
65 /// halos of multiple MPI ranks are counted only once.
66 ///
67 /// \relates Distribution
68 std::size_t globalNumNonMissingObs(const Distribution &dist,
69  size_t numVariables, const std::vector<double> &v);
70 std::size_t globalNumNonMissingObs(const Distribution &dist,
71  size_t numVariables, const std::vector<float> &v);
72 std::size_t globalNumNonMissingObs(const Distribution &dist,
73  size_t numVariables, const std::vector<int> &v);
74 std::size_t globalNumNonMissingObs(const Distribution &dist,
75  size_t numVariables, const std::vector<std::string> &v);
76 std::size_t globalNumNonMissingObs(const Distribution &dist,
77  size_t numVariables, const std::vector<util::DateTime> &v);
78 
79 /// \brief Create a suitable replica distribution for the distribution `master`.
80 ///
81 /// A replica distribution assigns each record `r` to a process if and only if another distribution
82 /// (the _master distribution_) has assigned the same record to that process.
83 ///
84 /// \param comm
85 /// Communicator used by the master distribution.
86 /// \param master
87 /// Master distribution.
88 /// \param masterRecordNums
89 /// Records of all observations assigned by the master distribution to the calling process.
90 std::shared_ptr<Distribution> createReplicaDistribution(
91  const eckit::mpi::Comm & comm,
92  std::shared_ptr<const Distribution> master,
93  const std::vector<std::size_t> &masterRecordNums);
94 
95 } // namespace ioda
96 
97 #endif // DISTRIBUTION_DISTRIBUTIONUTILS_H_
class for distributing obs across multiple process elements
std::size_t globalNumNonMissingObs(const Distribution &dist, size_t numVariables, const std::vector< double > &v)
Counts unique non-missing observations in a vector.
double dotProduct(const Distribution &dist, std::size_t numVariables, const std::vector< double > &v1, const std::vector< double > &v2)
std::size_t globalNumNonMissingObs(const Distribution &dist, std::size_t numVariables, const std::vector< double > &v)
std::shared_ptr< Distribution > createReplicaDistribution(const eckit::mpi::Comm &comm, std::shared_ptr< const Distribution > master, const std::vector< std::size_t > &masterRecordNums)
Create a suitable replica distribution for the distribution master.