www/dox/invmr_8cc_source.html

 /*! \file

  *  \brief Minimal-Residual (MR) for a generic fermion Linear Operator

  */


 #include "chromabase.h"

 #include "actions/ferm/invert/invmr.h"


 using namespace QDP::Hints;


 namespace Chroma

 {


   //! Minimal-residual (MR) algorithm for a generic Linear Operator
   /*! \ingroup invert
    * This subroutine uses the Minimal Residual (MR) algorithm to determine
    * the solution of the set of linear equations. Here we allow M to be nonhermitian.
    *
    *        Chi  =  M . Psi
    *
    * Algorithm:
    *
    *  Psi[0]                                        Argument
    *  r[0]    :=  Chi  -  M . Psi[0] ;              Initial residual
    *  IF |r[0]| <= RsdMR |Chi| THEN RETURN;         Converged?
    *  FOR k FROM 1 TO MaxMR DO                      MR iterations
    *      a[k-1]  := <M.r[k-1],r[k-1]> / <M.r[k-1],M.r[k-1]> ;
    *      ap[k-1] := MRovpar * a[k-1] ;             Overrelaxation step
    *      Psi[k]  := Psi[k-1] + ap[k-1] r[k-1] ;    New solution vector
    *      r[k]    := r[k-1] - ap[k-1] M . r[k-1] ;  New residual
    *      IF |r[k]| <= RsdMR |Chi| THEN RETURN;     Converged?
    *
    * All reductions and vector updates performed here are restricted to the
    * subset returned by M.subset().
    *
    * Arguments:
    *
    *  \param M       Linear Operator             (Read)
    *  \param chi     Source                      (Read)
    *  \param psi     Solution                    (Modify)
    *  \param MRovpar Overrelaxation parameter    (Read)
    *  \param RsdMR   MR residual accuracy        (Read)
    *  \param MaxMR   Maximum MR iterations       (Read)
    *  \param isign   Forwarded unchanged to every application of M (Read).
    *                 NOTE(review): presumably selects M versus its adjoint;
    *                 confirm against the LinearOperator interface.
    *
    *  \return n_count holds the number of MR iterations performed.
    *          resid holds sqrt(|Chi - M.Psi|^2) on the subset; it is not
    *          divided by |Chi|. On the early-return path (initial guess
    *          already converged) it is taken from the initial residual,
    *          otherwise it is recomputed from the final Psi.
    *
    * Local Variables:
    *
    *  r             Residual vector
    *  cp            | r[k] |**2
    *  c             < M.r[k-1], r[k-1] >
    *  d             < M.r[k-1], M.r[k-1] >
    *  a             a[k-1], then overwritten with MRovpar * a[k-1]
    *  k             MR iteration counter
    *  rsd_sq        RsdMR**2 * | Chi |**2, the convergence threshold for cp
    *  chi_internal  Copy of Chi on the subset
    *  Mr            Temporary for  M.Psi  and  M.r
    *
    * Subroutines:
    *
    *  M           Apply matrix to vector
    *
    * @{
    */
   template<typename T, typename C>
   SystemSolverResults_t
   InvMR_a(const C& M,
           const T& chi,
           T& psi,
           const Real& MRovpar,
           const Real& RsdMR,
           int MaxMR,
           enum PlusMinus isign)
   {
     START_CODE();

     const Subset& s = M.subset();

     SystemSolverResults_t  res;
     moveToFastMemoryHint(psi,true);
     T Mr;                moveToFastMemoryHint(Mr);
     T chi_internal;      moveToFastMemoryHint(chi_internal);

     chi_internal[s] = chi;

     Complex a;
     DComplex c;
     Double d;
     int k;

     QDPIO::cout << "InvMR: starting" << std::endl;
     FlopCounter flopcount;
     flopcount.reset();
     StopWatch swatch;
     swatch.reset();
     swatch.start();

     /*  Convergence threshold on |r|^2:  RsdMR^2 * |Chi|^2  */
     Real rsd_sq = (RsdMR * RsdMR) * Real(norm2(chi_internal,s));
     flopcount.addSiteFlops(4*Nc*Ns,s);

     /*  r[0]  :=  Chi - M . Psi[0] */
     /*  Mr  :=  M . Psi  */
     M(Mr, psi, isign);
     flopcount.addFlops(M.nFlops());

     T r;                moveToFastMemoryHint(r);
     r[s] = chi_internal - Mr;
     flopcount.addSiteFlops(2*Nc*Ns,s);

     /*  Cp = |r[0]|^2 */
     Double cp = norm2(r, s);
     flopcount.addSiteFlops(4*Nc*Ns, s);

 //  QDPIO::cout << "InvMR: k = 0  cp = " << cp << "  rsd_sq = " << rsd_sq << std::endl;

     /*  IF |r[0]| <= RsdMR |Chi| THEN RETURN; */
     if ( toBool(cp  <=  rsd_sq) )
     {
       res.n_count = 0;
       res.resid   = sqrt(cp);
       swatch.stop();
       flopcount.report("invMR", swatch.getTimeInSeconds());
       revertFromFastMemoryHint(psi,true);
       END_CODE();
       return res;
     }

     /*  FOR k FROM 1 TO MaxMR DO */
     k = 0;
     while( (k < MaxMR) && (toBool(cp > rsd_sq)) )
     {
       ++k;

       /*  a[k-1] := < M.r[k-1], r[k-1] >/ < M.r[k-1], M.r[k-1] > ; */
       /*  Mr = M * r  */
       M(Mr, r, isign);  flopcount.addFlops(M.nFlops());

       /*  c = < M.r, r > */
       c = innerProduct(Mr, r, s);  flopcount.addSiteFlops(4*Nc*Ns,s);

       /*  d = | M.r | ** 2  */
       d = norm2(Mr, s);  flopcount.addSiteFlops(4*Nc*Ns,s);

       /*  a = c / d */
       a = c / d;

       /*  a[k-1] *= MRovpar ; */
       a = a * MRovpar;

       /*  Psi[k] += a[k-1] r[k-1] ; */
       psi[s] += r * a;    flopcount.addSiteFlops(4*Nc*Ns,s);

       /*  r[k] -= a[k-1] M . r[k-1] ; */
       r[s] -= Mr * a;    flopcount.addSiteFlops(4*Nc*Ns,s);

       /*  cp  =  | r[k] |**2 */
       cp = norm2(r, s);    flopcount.addSiteFlops(4*Nc*Ns,s);

 //    QDPIO::cout << "InvMR: k = " << k << "  cp = " << cp << std::endl;
     }

     res.n_count = k;
     swatch.stop();
     QDPIO::cout << "InvMR: k = " << k << "  cp = " << cp << std::endl;
     flopcount.report("invmr", swatch.getTimeInSeconds());
     revertFromFastMemoryHint(psi,true);

     // Compute the actual residual from the final psi instead of trusting the
     // recursively updated r.  This extra application of M happens after the
     // stopwatch is stopped and is not added to the flop count.
     {
       M(Mr, psi, isign);
       Double actual_res = norm2(chi_internal - Mr,s);
       res.resid = sqrt(actual_res);
     }

     // Warn only when the iteration really stopped short of the tolerance.
     // Comparing n_count with MaxMR would also fire when convergence is reached
     // on exactly the last allowed iteration, and would stay silent when the
     // loop was left unconverged for another reason (MaxMR < 0, or cp no longer
     // comparable, e.g. NaN after d == 0).
     if ( ! toBool(cp <= rsd_sq) )
       QDPIO::cerr << "Nonconvergence Warning" << std::endl;

     END_CODE();
     return res;
   }


   //! MR solver entry point for LatticeFermion
   /*!
    * Explicit specialisation of InvMR (kept here "for now", per the original
    * note).  It forwards every argument, unchanged and in the same order, to
    * the generic InvMR_a implementation and returns that call's result.
    */
   template<>
   SystemSolverResults_t
   InvMR(const LinearOperator<LatticeFermion>& M,
         const LatticeFermion& chi,
         LatticeFermion& psi,
         const Real& MRovpar,
         const Real& RsdMR,
         int MaxMR,
         enum PlusMinus isign)
   {
     // Template arguments spelled out; they are the ones deduction would pick.
     return InvMR_a< LatticeFermion, LinearOperator<LatticeFermion> >(
       M, chi, psi, MRovpar, RsdMR, MaxMR, isign);
   }


   //! MR solver entry point for LatticeStaggeredFermion
   /*!
    * Explicit specialisation of InvMR (kept here "for now", per the original
    * note).  It forwards every argument, unchanged and in the same order, to
    * the generic InvMR_a implementation and returns that call's result.
    */
   template<>
   SystemSolverResults_t
   InvMR(const LinearOperator<LatticeStaggeredFermion>& M,
         const LatticeStaggeredFermion& chi,
         LatticeStaggeredFermion& psi,
         const Real& MRovpar,
         const Real& RsdMR,
         int MaxMR,
         enum PlusMinus isign)
   {
     // Template arguments spelled out; they are the ones deduction would pick.
     return InvMR_a< LatticeStaggeredFermion, LinearOperator<LatticeStaggeredFermion> >(
       M, chi, psi, MRovpar, RsdMR, MaxMR, isign);
   }


   /*! @} */  // end of group invert


 }  // end namespace Chroma

chromabase.h
Primary include file for CHROMA library code.

END_CODE
#define END_CODE()
Definition: chromabase.h:65

START_CODE
#define START_CODE()
Definition: chromabase.h:64

Chroma::LinearOperator< LatticeFermion >

Chroma::InvMR
SystemSolverResults_t InvMR(const LinearOperator< LatticeStaggeredFermion > &M, const LatticeStaggeredFermion &chi, LatticeStaggeredFermion &psi, const Real &MRovpar, const Real &RsdMR, int MaxMR, enum PlusMinus isign)
Definition: invmr.cc:200

Chroma::InvMR_a
SystemSolverResults_t InvMR_a(const C &M, const T &chi, T &psi, const Real &MRovpar, const Real &RsdMR, int MaxMR, enum PlusMinus isign)
Minimal-residual (MR) algorithm for a generic Linear Operator.
Definition: invmr.cc:66

invmr.h
Minimal-Residual (MR) for a generic fermion Linear Operator.

s
unsigned s
Definition: ldumul_w.cc:37

c
int c
Definition: meslate.cc:61

Chroma::BaryonSpinMats::C
SpinMatrix C()
C = Gamma(10)
Definition: barspinmat_w.cc:29

Chroma::InlinePropAndMatElemDistillation2Env::local::innerProduct
BinaryReturn< C1, C2, FnInnerProduct >::Type_t innerProduct(const QDPSubType< T1, C1 > &s1, const QDPType< T2, C2 > &s2)
Definition: inline_prop_and_matelem_distillation2_w.cc:463

Chroma
Asqtad Staggered-Dirac operator.
Definition: klein_gord.cc:10

Chroma::T
LinOpSysSolverMGProtoClover::T T
Definition: syssolver_linop_clover_mg_proto.cc:63

Chroma::rsd_sq
Real rsd_sq
Definition: invbicg.cc:121

Chroma::PlusMinus
PlusMinus
Definition: chromabase.h:45

Chroma::cp
Double cp
Definition: invbicg.cc:107

Chroma::a
Complex a
Definition: invbicg.cc:95

Chroma::d
DComplex d
Definition: invbicg.cc:99

Chroma::k
int k
Definition: invbicg.cc:119

Chroma::isign
isign
Definition: pbg5p_w.cc:58

testing::internal::Double
FloatingPoint< double > Double
Definition: gtest.h:7351

RsdMR
RsdMR
Definition: pade_trln_w.cc:26

r
multi1d< LatticeFermion > r(Ncb)

chi
chi
Definition: pade_trln_w.cc:24

psi
psi
Definition: pade_trln_w.cc:191

Chroma::SystemSolverResults_t
Holds return info from SystemSolver call.
Definition: syssolver.h:17

Chroma::SystemSolverResults_t::n_count
int n_count
Definition: syssolver.h:20

Chroma::SystemSolverResults_t::resid
Real resid
Definition: syssolver.h:21