doxygen-example/_q_newton_l_m_p_8h_source.html

 /*
  * (C) Copyright 2009-2016 ECMWF.
  *
  * This software is licensed under the terms of the Apache Licence Version 2.0
  * which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
  * In applying this licence, ECMWF does not waive the privileges and immunities
  * granted to it by virtue of its status as an intergovernmental organisation nor
  * does it submit to any jurisdiction.
  */

 #ifndef OOPS_ASSIMILATION_QNEWTONLMP_H_
 #define OOPS_ASSIMILATION_QNEWTONLMP_H_

 #include <algorithm>
 #include <string>
 #include <vector>

 #include "eckit/config/LocalConfiguration.h"
 #include "oops/util/dot_product.h"
 #include "oops/util/Logger.h"

 #include <boost/scoped_ptr.hpp>

 namespace oops {

   /*  The QUASI-NEWTON  Limited Memory preconditioner matrix \f$ C \f$
    *  for the system matrix \f$ AB = (I + Ht Rinv H B) \f$
    *
    *  It is defined as
    *  \f$ C_{k+1} = (I - \rho_k ph_k q_k^T) C_k (I - \rho_k q_k p_k^T) + \rho_k ph_k p_k^T \f$
    *
    *  For details, we refer to S. Gratton, A. Sartenaer and J. Tshimanga,
    *  SIAM J. Optim.,21(3),912–935,2011 and S. Gurol, PhD Manuscript, 2013.
    *
    *  The solvers represent matrices as objects that implement a "multiply"
    *  method. This class defines objects that apply the preconditioner matrix \f$ C \f$.
    */

 // -----------------------------------------------------------------------------

 // Limited-memory preconditioner built from vector pairs collected during the
 // minimization. Pairs are first buffered by push(), then turned into the
 // active set by update(); multiply()/tmultiply() apply the active set.
 template<typename VECTOR, typename BMATRIX> class QNewtonLMP {
  public:
   // Reads "nouter" and the optional "preconditioner" section
   // (maxpairs, useoldpairs, maxnewpairs) from the configuration.
   explicit QNewtonLMP(const eckit::Configuration &);
   ~QNewtonLMP() {}

   // Buffers one set of vectors (p, ph, ap) together with 1/rho for the next
   // update(). At most maxnewpairs_ entries are kept; the oldest is dropped first.
   void push(const VECTOR &, const VECTOR &, const VECTOR &, const double &);
   // Moves the buffered pairs into the active set (also storing B*ap for each),
   // discarding old pairs as needed to respect maxpairs_, then empties the buffer.
   void update(const BMATRIX & B);

   // Applies the preconditioner: the second argument receives the result.
   // With no active pairs the result is a copy of the first argument.
   void multiply(const VECTOR &, VECTOR &) const;

   // Matrix-vector products with the transpose of the preconditioner
   void tmultiply(const VECTOR &, VECTOR &) const;

  private:
   unsigned maxpairs_;      // maximum number of active pairs ("maxpairs", 0 if absent)
   unsigned maxnewpairs_;   // maximum number of pairs buffered by push() between updates
   bool useoldpairs_;       // when false, update() discards all previously active pairs
   int maxouter_;           // value of "nouter"; pairs are only stored while update_ < maxouter_
   int update_;             // starts at 1 and is incremented by every update() call

   // Active pairs used by multiply()/tmultiply(); all five vectors grow and
   // shrink together in update().
   std::vector<VECTOR> P_;
   std::vector<VECTOR> Ph_;
   std::vector<VECTOR> AP_;
   std::vector<VECTOR> BAP_;     // result of Bmat.multiply() applied to each AP_ entry
   std::vector<double> rhos_;    // holds the 1/rho values stored by push()
   // Per-outer-loop counts of pairs still in use; update() zeroes and
   // decrements these counts and reports them in the log.
   std::vector<unsigned> usedpairIndx_;

   // Pairs buffered by push() since the last update().
   std::vector<VECTOR> savedP_;
   std::vector<VECTOR> savedPh_;
   std::vector<VECTOR> savedAP_;
   std::vector<double> savedrhos_;   // 1/rho for each buffered pair
 };

 // =============================================================================

 /// Builds the preconditioner settings from the configuration.
 ///
 /// "nouter" is read unconditionally. The optional "preconditioner" section
 /// may contain:
 ///  - "maxpairs":    maximum number of active pairs (stays 0 when absent);
 ///  - "useoldpairs": "on" or "true" keeps pairs from earlier updates;
 ///  - "maxnewpairs": only honoured when old pairs are kept, and capped at
 ///                   "maxpairs". Otherwise the limit equals "maxpairs".
 template<typename VECTOR, typename BMATRIX>
 QNewtonLMP<VECTOR, BMATRIX>::QNewtonLMP(const eckit::Configuration & conf)
   : maxpairs_(0), maxnewpairs_(0), useoldpairs_(false), maxouter_(0), update_(1)
 {
   maxouter_ = conf.getInt("nouter");
   Log::info() << "QNewtonLMP: maxouter : " << maxouter_ << std::endl;

   // No preconditioner section: every limit keeps its zero default.
   if (!conf.has("preconditioner")) return;

   const eckit::LocalConfiguration precond(conf, "preconditioner");
   if (precond.has("maxpairs")) maxpairs_ = precond.getInt("maxpairs");

   // Nothing else is read when no pair may be stored.
   if (maxpairs_ == 0) return;

   const std::string old =
     precond.has("useoldpairs") ? precond.getString("useoldpairs") : std::string();
   useoldpairs_ = (old == "on" || old == "true");

   // Default limit for new pairs; narrowed below when a dedicated value is given.
   maxnewpairs_ = maxpairs_;
   if (useoldpairs_ && precond.has("maxnewpairs")) {
     const unsigned requested = precond.getInt("maxnewpairs");
     maxnewpairs_ = std::min(maxpairs_, requested);
   }
 }

 // -----------------------------------------------------------------------------

 /// Buffers one set of vectors for the next call to update().
 ///
 /// \param p, ph, ap  vectors to store (copied).
 /// \param rho        scalar associated with the pair; its inverse is stored.
 ///
 /// Nothing is stored when no new pair is allowed (maxnewpairs_ == 0) or once
 /// update_ has reached maxouter_. When the buffer already holds maxnewpairs_
 /// entries, the oldest one is dropped to make room.
 template<typename VECTOR, typename BMATRIX>
 void QNewtonLMP<VECTOR, BMATRIX>::push(const VECTOR & p, const VECTOR & ph,
                                        const VECTOR & ap, const double & rho) {
   ASSERT(savedP_.size() <= maxnewpairs_);

   const bool storing = (maxnewpairs_ > 0) && (update_ < maxouter_);
   if (!storing) return;

   // Buffer full: forget the oldest entry of each list before appending.
   const bool full = (savedP_.size() == maxnewpairs_);
   if (full) {
     savedP_.erase(savedP_.begin());
     savedPh_.erase(savedPh_.begin());
     savedAP_.erase(savedAP_.begin());
     savedrhos_.erase(savedrhos_.begin());
   }

   savedP_.push_back(p);
   savedPh_.push_back(ph);
   savedAP_.push_back(ap);
   const double inverseRho = 1.0/rho;
   savedrhos_.push_back(inverseRho);
 }

 // -----------------------------------------------------------------------------

 /// Turns the pairs buffered by push() into the active set used by
 /// multiply()/tmultiply(), then empties the buffer.
 ///
 /// \param Bmat  operator applied to each new AP vector; the product is cached
 ///              in BAP_.
 ///
 /// Steps:
 ///  1. All active pairs are dropped when old pairs are not reused, or when
 ///     the buffered pairs alone reach maxpairs_.
 ///  2. While update_ < maxouter_ and at least one pair is buffered, the oldest
 ///     active pairs are evicted so that old + new fits in maxpairs_, and the
 ///     most recent buffered pairs are appended.
 ///  3. update_ is incremented and the buffer is cleared, whether or not pairs
 ///     were added.
 ///
 /// usedpairIndx_ receives one entry per call (the number of pairs this call
 /// contributed), so that entry k always refers to the (k+1)-th update and the
 /// sum of the entries equals the number of active pairs.
 template<typename VECTOR, typename BMATRIX>
 void QNewtonLMP<VECTOR, BMATRIX>::update(const BMATRIX & Bmat) {
   Log::debug() << "QNewtonLMP size saved Ph    = " << savedPh_.size() << std::endl;
   Log::debug() << "QNewtonLMP size saved P     = " << savedP_.size() << std::endl;
   Log::debug() << "QNewtonLMP size saved AP    = " << savedAP_.size() << std::endl;
   Log::debug() << "QNewtonLMP size saved rhos  = " << savedrhos_.size() << std::endl;

   const unsigned nvec = savedPh_.size();
   ASSERT(savedP_.size() == nvec);
   ASSERT(savedAP_.size() == nvec);
   ASSERT(savedrhos_.size() == nvec);

   // Start from an empty active set; the per-loop counts are zeroed (not
   // erased) so that their positions keep matching the outer-loop numbers.
   if (!useoldpairs_ || nvec >= maxpairs_) {
     Ph_.clear();
     P_.clear();
     AP_.clear();
     BAP_.clear();
     rhos_.clear();
     std::fill(usedpairIndx_.begin(), usedpairIndx_.end(), 0u);
   }

   if (nvec > 0 && update_ < maxouter_) {
     Log::info() << "QNewtonLMP: update " << update_ << ", max = " << maxouter_-1 << std::endl;
     const unsigned newpairs = std::min(nvec, maxpairs_);
     unsigned oldpairs = P_.size();
     unsigned rmpairs = 0;
 //  First remove pairs we no longer need.
     if (oldpairs + newpairs > maxpairs_) {
       // newpairs <= maxpairs_, hence rmpairs <= oldpairs and the ranges are valid.
       rmpairs = oldpairs + newpairs - maxpairs_;
       Ph_.erase(Ph_.begin(), Ph_.begin() + rmpairs);
       P_.erase(P_.begin(), P_.begin() + rmpairs);
       AP_.erase(AP_.begin(), AP_.begin() + rmpairs);
       BAP_.erase(BAP_.begin(), BAP_.begin() + rmpairs);
       rhos_.erase(rhos_.begin(), rhos_.begin() + rmpairs);
       oldpairs -= rmpairs;
 //    Keep information on how many pairs are used at each minimization loop
       // Evicted pairs are the oldest ones, so they are charged to the
       // earliest outer loops first.
       unsigned removed = rmpairs;
       for (unsigned kiter = 0; kiter < usedpairIndx_.size(); ++kiter) {
         const unsigned rmiter = std::min(usedpairIndx_[kiter], removed);
         usedpairIndx_[kiter] -= rmiter;
         removed -= rmiter;
       }
       ASSERT(removed == 0);
     }
     ASSERT(P_.size() == oldpairs);
     ASSERT(oldpairs + newpairs <= maxpairs_);

 //  Add the new pairs.
     // Only the most recent `newpairs` buffered entries are kept.
     for (unsigned jv = nvec - newpairs; jv < nvec; ++jv) {
       P_.push_back(savedP_[jv]);
       Ph_.push_back(savedPh_[jv]);
       AP_.push_back(savedAP_[jv]);
       rhos_.push_back(savedrhos_[jv]);
       // Save B*ap
       VECTOR ww(savedAP_[jv]);
       Bmat.multiply(savedAP_[jv], ww);
       BAP_.push_back(ww);
     }
     ASSERT(P_.size() == oldpairs + newpairs);

     // Record this loop's contribution; without it the eviction accounting
     // above has nothing to subtract from and its ASSERT fails.
     usedpairIndx_.push_back(newpairs);

     Log::info() << "Number of inner iterations       : " << nvec << std::endl;
     Log::info() << "Number of maximum pairs          : " << maxpairs_ << std::endl;
     Log::info() << "Number of used total pairs       : " << oldpairs + newpairs << std::endl;
     Log::info() << "Number of new pairs              : " << newpairs << std::endl;
     Log::info() << "Number of removed old pairs      : " << rmpairs << std::endl;
     for (unsigned kiter = 0; kiter < usedpairIndx_.size(); ++kiter) {
       Log::info() << "Number of used pairs from outer loop " << kiter + 1
                 << " : "                                   << usedpairIndx_[kiter]
                 << std::endl;
     }
   } else {
     // This call contributed no pair; keep one entry per update so that the
     // positions in usedpairIndx_ still match the outer-loop numbers.
     usedpairIndx_.push_back(0);
   }

   ++update_;
   savedP_.clear();
   savedPh_.clear();
   savedAP_.clear();
   savedrhos_.clear();
 }

 // -----------------------------------------------------------------------------

 /// Applies the preconditioner to a vector.
 ///
 /// \param a  input vector (not modified).
 /// \param b  output vector, overwritten with the result. When no pair is
 ///           active, b is simply a copy of a.
 ///
 /// The product is formed by two sweeps over the active pairs:
 ///  - newest to oldest: eta_i = rhos_[i] * <b, P_[i]>, then b -= eta_i * AP_[i];
 ///  - a scalar scaling computed from the newest pair;
 ///  - oldest to newest: sigma_i = rhos_[i] * <b, BAP_[i]> - eta_i,
 ///    then b -= sigma_i * Ph_[i].
 /// rhos_ holds the inverse of the rho values given to push().
 template<typename VECTOR, typename BMATRIX>
 void QNewtonLMP<VECTOR, BMATRIX>::multiply(const VECTOR & a, VECTOR & b) const {
   b = a;
   const unsigned nvec = P_.size();
   if (nvec != 0) {
     // Coefficients are stored at the index of their own pair: the second
     // sweep runs in the opposite direction and must reuse the coefficient of
     // the same pair, not the one found at the same position in visiting order.
     std::vector<double> etas(nvec, 0.0);
     for (int iiter = nvec-1; iiter >= 0; iiter--) {
       const double eta = dot_product(b, P_[iiter]) * rhos_[iiter];
       etas[iiter] = eta;
       b.axpy(-eta, AP_[iiter]);
     }
     // Scaling of the intermediate vector, taken from the most recent pair.
     b *= dot_product(AP_[nvec-1], AP_[nvec-1])/dot_product(AP_[nvec-1], Ph_[nvec-1]);
     for (unsigned iiter = 0; iiter < nvec; ++iiter) {
       const double sigma = dot_product(b, BAP_[iiter]) * rhos_[iiter] - etas[iiter];
       b.axpy(-sigma, Ph_[iiter]);
     }
   }
 }

 // -----------------------------------------------------------------------------

 /// Applies the transpose of the preconditioner to a vector.
 ///
 /// \param a  input vector (not modified).
 /// \param b  output vector, overwritten with the result. When no pair is
 ///           active, b is simply a copy of a.
 ///
 /// Same two-sweep scheme as multiply(), with the roles of the stored vectors
 /// exchanged:
 ///  - newest to oldest: eta_i = rhos_[i] * <b, Ph_[i]>, then b -= eta_i * BAP_[i];
 ///  - a scalar scaling computed from the newest pair;
 ///  - oldest to newest: sigma_i = rhos_[i] * <b, AP_[i]> - eta_i,
 ///    then b -= sigma_i * P_[i].
 /// rhos_ holds the inverse of the rho values given to push().
 template<typename VECTOR, typename BMATRIX>
 void QNewtonLMP<VECTOR, BMATRIX>::tmultiply(const VECTOR & a, VECTOR & b) const {
   b = a;
   const unsigned nvec = P_.size();
   if (nvec != 0) {
     // Coefficients are stored at the index of their own pair: the second
     // sweep runs in the opposite direction and must reuse the coefficient of
     // the same pair, not the one found at the same position in visiting order.
     std::vector<double> etas(nvec, 0.0);
     for (int iiter = nvec-1; iiter >= 0; iiter--) {
       const double eta = dot_product(b, Ph_[iiter]) * rhos_[iiter];
       etas[iiter] = eta;
       b.axpy(-eta, BAP_[iiter]);
     }
     // Scaling of the intermediate vector, taken from the most recent pair.
     b *= dot_product(AP_[nvec-1], AP_[nvec-1])/dot_product(AP_[nvec-1], Ph_[nvec-1]);
     for (unsigned iiter = 0; iiter < nvec; ++iiter) {
       const double sigma = dot_product(b, AP_[iiter]) * rhos_[iiter] - etas[iiter];
       b.axpy(-sigma, P_[iiter]);
     }
   }
 }

 // -----------------------------------------------------------------------------

 }  // namespace oops

 #endif  // OOPS_ASSIMILATION_QNEWTONLMP_H_
oops::QNewtonLMP::push
void push(const VECTOR &, const VECTOR &, const VECTOR &, const double &)
Definition: QNewtonLMP.h:103

oops::QNewtonLMP::rhos_
std::vector< double > rhos_
Definition: QNewtonLMP.h:65

oops::QNewtonLMP::BAP_
std::vector< VECTOR > BAP_
Definition: QNewtonLMP.h:64

oops::QNewtonLMP::update
void update(const BMATRIX &B)
Definition: QNewtonLMP.h:123

oops::QNewtonLMP::P_
std::vector< VECTOR > P_
Definition: QNewtonLMP.h:61

conf
Definition: conf.py:1

gsw_mod_check_data::rho
type(gsw_result) rho
Definition: gsw_mod_check_data.f90:2723

oops::QNewtonLMP::maxnewpairs_
unsigned maxnewpairs_
Definition: QNewtonLMP.h:56

oops::QNewtonLMP::QNewtonLMP
QNewtonLMP(const eckit::Configuration &)
Definition: QNewtonLMP.h:77

interpolator_mod::sigma
integer, parameter sigma
Flags to indicate where climatology pressure levels are pressure or sigma levels. ...
Definition: interpolator.F90:344

gsw_mod_check_data::p
real(r8), dimension(cast_m, cast_n) p
Definition: gsw_mod_check_data.f90:247

binary_file_utility::false
integer(long), parameter false
Definition: Binary_File_Utility.f90:60

oops::QNewtonLMP::maxpairs_
unsigned maxpairs_
Definition: QNewtonLMP.h:55

oops::QNewtonLMP::tmultiply
void tmultiply(const VECTOR &, VECTOR &) const
Definition: QNewtonLMP.h:232

oops
The namespace for the main oops code.
Definition: ErrorCovarianceFV3JEDI.h:24

mpp_mod::debug
logical debug
Definition: mpp.F90:1297

oops::QNewtonLMP::multiply
void multiply(const VECTOR &, VECTOR &) const
Definition: QNewtonLMP.h:207

oops::QNewtonLMP::savedP_
std::vector< VECTOR > savedP_
Definition: QNewtonLMP.h:68

oops::QNewtonLMP::savedAP_
std::vector< VECTOR > savedAP_
Definition: QNewtonLMP.h:70

fv3jedi_varcha_c2m_mod::multiply
subroutine, public multiply(self, geom, xctl, xmod)
Definition: fv3jedi_varcha_c2m_mod.f90:114

oops::QNewtonLMP::AP_
std::vector< VECTOR > AP_
Definition: QNewtonLMP.h:63

fv3jedi_geom_mod::info
subroutine, public info(self)
Definition: fv3jedi_geom_mod.f90:494

gsw_mod_freezing_poly_coefficients::b
real(r8), parameter b
Definition: gsw_mod_freezing_poly_coefficients.f90:35

oops::QNewtonLMP::savedrhos_
std::vector< double > savedrhos_
Definition: QNewtonLMP.h:71

oops::QNewtonLMP::update_
int update_
Definition: QNewtonLMP.h:59

oops::QNewtonLMP::maxouter_
int maxouter_
Definition: QNewtonLMP.h:58

tools_asa007::eta
real(kind_real), parameter eta
Definition: tools_asa007.F90:21

oops::QNewtonLMP
Definition: QNewtonLMP.h:41

a
************************************************************************GNU Lesser General Public License **This file is part of the GFDL Flexible Modeling System(FMS). ! *! *FMS is free software without even the implied warranty of MERCHANTABILITY or *FITNESS FOR A PARTICULAR PURPOSE See the GNU General Public License *for more details **You should have received a copy of the GNU Lesser General Public *License along with FMS If see< http:! ***********************************************************************!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! !! MPP_TRANSMIT !! !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! subroutine MPP_TRANSMIT_(put_data, put_len, to_pe, get_data, get_len, from_pe, block, tag, recv_request, send_request)!a message-passing routine intended to be reminiscent equally of both MPI and SHMEM!put_data and get_data are contiguous MPP_TYPE_ arrays!at each call, your put_data array is put to to_pe 's get_data! your get_data array is got from from_pe 's put_data!i.e we assume that typically(e.g updating halo regions) each PE performs a put _and_ a get!special PE designations:! NULL_PE:to disable a put or a get(e.g at boundaries)! ANY_PE:if remote PE for the put or get is to be unspecific! 
ALL_PES:broadcast and collect operations(collect not yet implemented)!ideally we would not pass length, but this f77-style call performs better(arrays passed by address, not descriptor)!further, this permits< length > contiguous words from an array of any rank to be passed(avoiding f90 rank conformance check)!caller is responsible for completion checks(mpp_sync_self) before and after integer, intent(in) ::put_len, to_pe, get_len, from_pe MPP_TYPE_, intent(in) ::put_data(*) MPP_TYPE_, intent(out) ::get_data(*) logical, intent(in), optional ::block integer, intent(in), optional ::tag integer, intent(out), optional ::recv_request, send_request logical ::block_comm integer ::i MPP_TYPE_, allocatable, save ::local_data(:) !local copy used by non-parallel code(no SHMEM or MPI) integer ::comm_tag integer ::rsize if(.NOT.module_is_initialized) call mpp_error(FATAL, 'MPP_TRANSMIT:You must first call mpp_init.') if(to_pe.EQ.NULL_PE .AND. from_pe.EQ.NULL_PE) return block_comm=.true. if(PRESENT(block)) block_comm=block if(debug) then call SYSTEM_CLOCK(tick) write(stdout_unit,'(a, i18, a, i6, a, 2i6, 2i8)')&'T=', tick, ' PE=', pe, ' MPP_TRANSMIT begin:to_pe, from_pe, put_len, get_len=', to_pe, from_pe, put_len, get_len end if comm_tag=DEFAULT_TAG if(present(tag)) comm_tag=tag!do put first and then get if(to_pe.GE.0 .AND. to_pe.LT.npes) then!use non-blocking sends if(debug .and.(current_clock.NE.0)) call SYSTEM_CLOCK(start_tick)!z1l:truly non-blocking send.! if(request(to_pe).NE.MPI_REQUEST_NULL) then !only one message from pe-> to_pe in queue *PE waiting for to_pe ! call error else get_len so only do gets but you cannot have a pure get with MPI call a get means do a wait to ensure put on remote PE is complete error call increase mpp_nml request_multiply call MPP_TRANSMIT get_len end if return end subroutine MPP_TRANSMIT_ ! MPP_BROADCAST ! subroutine but that doesn t allow !broadcast to a subset of PEs This version and mpp_transmit will remain !backward compatible intent(inout) a
Definition: mpp_transmit_mpi.h:178

oops::QNewtonLMP::usedpairIndx_
std::vector< unsigned > usedpairIndx_
Definition: QNewtonLMP.h:66

oops::QNewtonLMP::~QNewtonLMP
~QNewtonLMP()
Definition: QNewtonLMP.h:44

min
#define min(a, b)
Definition: mosaic_util.h:32

oops::QNewtonLMP::Ph_
std::vector< VECTOR > Ph_
Definition: QNewtonLMP.h:62

oops::QNewtonLMP::savedPh_
std::vector< VECTOR > savedPh_
Definition: QNewtonLMP.h:69

oops::QNewtonLMP::useoldpairs_
bool useoldpairs_
Definition: QNewtonLMP.h:57