1.0/oops/_d_r_i_p_c_g_minimizer_8h_source.html

/*

 * (C) Copyright 2009-2016 ECMWF.

 *

 * This software is licensed under the terms of the Apache Licence Version 2.0

 * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.

 * In applying this licence, ECMWF does not waive the privileges and immunities

 * granted to it by virtue of its status as an intergovernmental organisation nor

 * does it submit to any jurisdiction.

 */


#ifndef OOPS_ASSIMILATION_DRIPCGMINIMIZER_H_

#define OOPS_ASSIMILATION_DRIPCGMINIMIZER_H_


#include <cmath>

#include <string>

#include <vector>


#include "oops/assimilation/BMatrix.h"

#include "oops/assimilation/ControlIncrement.h"

#include "oops/assimilation/CostFunction.h"

#include "oops/assimilation/DRMinimizer.h"

#include "oops/assimilation/HtRinvHMatrix.h"

#include "oops/assimilation/QNewtonLMP.h"

#include "oops/util/dot_product.h"

#include "oops/util/formats.h"

#include "oops/util/Logger.h"


namespace oops {


/// Derber-Rosati IPCG Minimizer

/*!

 * \brief Derber-Rosati Inexact-Preconditioned Conjugate Gradients solver.

 *

 * This solver is based on the Golub-Ye Inexact-Preconditioned Conjugate

 * Gradients solver for Ax=b (G.H. Golub and Q. Ye 1999/00,

 * SIAM J. Sci. Comput. 21(4) 1305-1320), and on the Derber and Rosati double

 * PCG algorithm (J. Derber and A. Rosati, 1989, J. Phys. Oceanog. 1333-1347).

 * It solves \f$ Ax=b\f$ for the particular case \f$ A=B^{-1}+C\f$,

 * without requiring the application of \f$ B^{-1}\f$.

 *

 * A must be square, symmetric, positive definite.

 *

 * A preconditioner must be supplied that, given a vector q, returns an

 * approximation to \f$ (AB)^{-1} q\f$. The preconditioner can be variable.

 * Note that the traditional \f$ B\f$-preconditioning corresponds to

 * precond=\f$I\f$.

 *

 * On entry:

 * -    x       =  starting point, \f$ X_0 \f$.

 * -    xh      = \f$ B^{-1} x_0\f$.

 * -    b       = right hand side.

 * -    B       = \f$ B \f$.

 * -    C       = \f$ C \f$.

 * -    precond = preconditioner \f$ F_k \approx (AB)^{-1} \f$.

 *

 * On exit, x will contain the solution \f$ x \f$ and xh will contain

 * \f$ B^{-1} x\f$.

 *  The return value is the achieved reduction in residual norm.

 *

 *  Iteration will stop if the maximum iteration limit "maxiter" is reached

 *  or if the residual norm reduces by a factor of "tolerance".

 *

 *  Each of BMATRIX, CMATRIX and PMATRIX must implement a method:

 *  - void multiply(const VECTOR&, VECTOR&) const

 *

 *  which applies the matrix to the first argument, and returns the

 *  matrix-vector product in the second. (Note: the const is optonal, but

 *  recommended.)

 */


// -----------------------------------------------------------------------------


template<typename MODEL, typename OBS> class DRIPCGMinimizer : public DRMinimizer<MODEL, OBS> {

  typedef BMatrix<MODEL, OBS>             Bmat_;

  typedef CostFunction<MODEL, OBS>        CostFct_;

  typedef ControlIncrement<MODEL, OBS>    CtrlInc_;

  typedef HtRinvHMatrix<MODEL, OBS>       HtRinvH_;


 public:

  const std::string classname() const override {return "DRIPCGMinimizer";}

  DRIPCGMinimizer(const eckit::Configuration &, const CostFct_ &);

  ~DRIPCGMinimizer() {}


 private:

  double solve(CtrlInc_ &, CtrlInc_ &, CtrlInc_ &, const Bmat_ &, const HtRinvH_ &,

               const double, const double, const int, const double) override;


  QNewtonLMP<CtrlInc_, Bmat_> lmp_;

};


// =============================================================================


template<typename MODEL, typename OBS>

DRIPCGMinimizer<MODEL, OBS>::DRIPCGMinimizer(const eckit::Configuration & conf, const CostFct_ & J)

  : DRMinimizer<MODEL, OBS>(J), lmp_(conf)

{}


// -----------------------------------------------------------------------------


template<typename MODEL, typename OBS>

double DRIPCGMinimizer<MODEL, OBS>::solve(CtrlInc_ & xx, CtrlInc_ & xh, CtrlInc_ & rr,

                                    const Bmat_ & B, const HtRinvH_ & HtRinvH,

                                    const double costJ0Jb, const double costJ0JoJc,

                                    const int maxiter, const double tolerance) {

  CtrlInc_ ap(xh);

  CtrlInc_ pp(xh);

  CtrlInc_ ph(xh);

  CtrlInc_ ss(xh);

  CtrlInc_ sh(xh);

  CtrlInc_ dr(xh);

  CtrlInc_ r0(xh);


  std::vector<CtrlInc_> vvecs;  // for re-orthogonalization

  std::vector<CtrlInc_> zvecs;  // for re-orthogonalization

  std::vector<double> scals;  // for re-orthogonalization

  // reserve space in vectors to avoid extra copies

  vvecs.reserve(maxiter+1);

  zvecs.reserve(maxiter+1);

  scals.reserve(maxiter+1);


  const double costJ0 = costJ0Jb + costJ0JoJc;


  r0 = rr;


  lmp_.multiply(rr, sh);

  B.multiply(sh, ss);


  double dotRr0  = dot_product(rr, rr);

  double dotSr0  = dot_product(rr, ss);

  double normReduction = 1.0;

  double rdots = dotSr0;

  double rdots_old = dotSr0;


  vvecs.push_back(rr);

  zvecs.push_back(ss);

  scals.push_back(1.0/dotSr0);


  Log::info() << std::endl;

  for (int jiter = 0; jiter < maxiter; ++jiter) {

    Log::info() << " DRIPCG Starting Iteration " << jiter+1 << std::endl;


    if (jiter == 0) {

      pp = ss;

      ph = sh;

    } else {

      dr -= rr;  // dr=oldr-r

      double beta = -dot_product(ss, dr)/rdots_old;


      pp *= beta;

      pp += ss;      // p = s + beta*p


      ph *= beta;

      ph += sh;      // ph = sh + beta*ph

    }


    HtRinvH.multiply(pp, ap);

    ap += ph;


    dr = rr;


    double rho = dot_product(pp, ap);

    double alpha = rdots/rho;

    Log::info() << "DRIPCGMinimizer rho = " << rho << ", alpha = " << alpha << std::endl;


    xx.axpy(alpha, pp);   // xx = xx + alpha*pp

    xh.axpy(alpha, ph);   // xh = xh + alpha*ph

    rr.axpy(-alpha, ap);  // rr = rr - alpha*ap


    // Compute the quadratic cost function

    double costJ = costJ0 - 0.5 * dot_product(xx, r0);

    double costJb = costJ0Jb + 0.5 * dot_product(xx, xh);

    double costJoJc = costJ - costJb;


    // Re-orthogonalization

    for (int jj = 0; jj < jiter; ++jj) {

      double proj = scals[jj] * dot_product(rr, zvecs[jj]);

      rr.axpy(-proj, vvecs[jj]);

    }


    lmp_.multiply(rr, sh);

    B.multiply(sh, ss);


    rdots_old = rdots;

    rdots = dot_product(rr, ss);

//  There is an issue where in some cases ss goes to zero before rr. The convergence

//  check below only checks for rr. Leaving the commented lines here for further invertigation.

//  double sdots = dot_product(ss, ss);

//  double rdotr = dot_product(rr, rr);

//  Log::info() << "DRIPCGMinimizer rdots = " << rdots

//              << ", sdots = " << sdots << ", rdotr = " << rdotr << std::endl;

    normReduction = sqrt(dot_product(rr, rr)/dotRr0);


    Log::info() << "DRIPCG end of iteration " << jiter+1 << ". Norm reduction= "

                << util::full_precision(normReduction) << std::endl

                << "  Quadratic cost function: J   (" <<  jiter+1 << ") = "

                << util::full_precision(costJ)         << std::endl

                << "  Quadratic cost function: Jb  (" <<  jiter+1 << ") = "

                << util::full_precision(costJb)        << std::endl

                << "  Quadratic cost function: JoJc(" << jiter+1 << ") = "

                << util::full_precision(costJoJc)      << std::endl << std::endl;


    // Save the pairs for preconditioning

    lmp_.push(pp, ph, ap, rho);


    if (normReduction < tolerance) {

      Log::info() << "DRIPCG: Achieved required reduction in residual norm." << std::endl;

      break;

    }


    vvecs.push_back(rr);

    zvecs.push_back(ss);

    scals.push_back(1.0/rdots);

  }


// Generate the (second-level) Limited Memory Preconditioner

  lmp_.update(B);


  return normReduction;

}


// -----------------------------------------------------------------------------


}  // namespace oops


#endif  // OOPS_ASSIMILATION_DRIPCGMINIMIZER_H_