www/dox/invcg1__array_8cc_source.html

 /*! \file

  *  \brief Conjugate-Gradient algorithm for a generic Linear Operator

  */


 #include "chromabase.h"

 #include "actions/ferm/invert/invcg1_array.h"


 using namespace QDP::Hints;


 namespace Chroma {


 //! Conjugate-Gradient (CGNE) algorithm for a generic Linear Operator

 /*! \ingroup invert

  * This subroutine uses the Conjugate Gradient (CG) algorithm to find

  * the solution of the set of linear equations

  *

  *          Chi  =  A . Psi

  *

  * where       A is hermitian

  *

  * Algorithm:


  *  Psi[0]  :=  initial guess;                 Linear interpolation (argument)

  *  r[0]    :=  Chi - M^dag . M . Psi[0] ;     Initial residual

  *  p[1]    :=  r[0] ;                         Initial direction

  *  IF |r[0]| <= RsdCG |Chi| THEN RETURN;      Converged?

  *  FOR k FROM 1 TO MaxCG DO                   CG iterations

  *      a[k] := |r[k-1]|**2 / <Mp[k],Mp[k]> ;

  *      Psi[k] += a[k] p[k] ;                  New solution std::vector

  *      r[k] -= a[k] M^dag . M . p[k] ;        New residual

  *      IF |r[k]| <= RsdCG |Chi| THEN RETURN;  Converged?

  *      b[k+1] := |r[k]|**2 / |r[k-1]|**2 ;

  *      p[k+1] := r[k] + b[k+1] p[k];          New direction

  *

  * Arguments:

  *

  *  \param M       Linear Operator             (Read)

  *  \param chi     Source                      (Read)

  *  \param psi     Solution                    (Modify)

  *  \param RsdCG   CG residual accuracy        (Read)

  *  \param MaxCG   Maximum CG iterations       (Read)

  *  \param n_count Number of CG iteration      (Write)

  *

  * Local Variables:

  *

  *  p                  Direction std::vector

  *  r                  Residual std::vector

  *  cp                 | r[k] |**2

  *  c                  | r[k-1] |**2

  *  k                  CG iteration counter

  *  a                  a[k]

  *  b                  b[k+1]

  *  d                  < p[k], A.p[k] >

  *  Mp                 Temporary for  M.p

  *

  * Subroutines:

  *                             +

  *  A       Apply matrix M or M  to std::vector

  *

  * Operations:

  *

  *  2 A + 2 Nc Ns + N_Count ( 2 A + 10 Nc Ns )

  */


 #undef PRINT_5D_RESID

 template<typename T>

 void InvCG1_a(const LinearOperatorArray<T>& A,

               const multi1d<T> & chi,

               multi1d<T>& psi,

               const Real& RsdCG,

               int MaxCG,

               int& n_count)

 {

   START_CODE();


   const int N = psi.size();

   const Subset& s = A.subset();


   multi1d<T> Ap(N);             moveToFastMemoryHint(Ap);


                                 moveToFastMemoryHint(psi,true);


   multi1d<T> r(N);              moveToFastMemoryHint(r);

   multi1d<T> p(N);              moveToFastMemoryHint(p);

   multi1d<T> chi_internal(N);   moveToFastMemoryHint(chi_internal);


   for(int i=0; i < N; i++) {

     chi_internal[i][s] = chi[i];

   }


   Real chi_sq =  Real(norm2(chi_internal,s));


   QDPIO::cout << "chi_norm = " << sqrt(chi_sq) << std::endl;

   Real rsd_sq = (RsdCG * RsdCG) * chi_sq;


   //

   //  r[0]  :=  Chi - A . Psi[0]    where  A is hermitian


   //

   //  r  :=  [ Chi  -  A. psi ]


   A(Ap, psi, PLUS);

   for(int n=0; n < N; ++n)

     r[n][s] = chi[n] - Ap[n];


 #ifdef PRINT_5D_RESID

   for(int n=0; n < N; n++) {

     Double norm_r = norm2(r[n],s);

     if( toBool( norm_r > Double(1.0e-20)) ) {

       QDPIO::cout << "Iteration 0  r[" << n << "] = " << norm_r << std::endl;

     }

   }

 #endif


   //  p[1]  :=  r[0]

   for(int n=0; n < N; ++n) {

     p[n][s] = r[n];

   }


   //  Cp = |r[0]|^2

   Double cp = norm2(r, s);                 /* 2 Nc Ns  flops */


   QDPIO::cout << "InvCG: k = 0  cp = " << cp << "  rsd_sq = " << rsd_sq << std::endl;


   //  IF |r[0]| <= RsdCG |Chi| THEN RETURN;

   if ( toBool(cp  <=  rsd_sq) )

   {

     n_count = 0;

     revertFromFastMemoryHint(psi,true);

     END_CODE();

     return;

   }


   //

   //  FOR k FROM 1 TO MaxCG DO

   //

   Real a, b;

   Double c, d;


   for(int k = 1; k <= MaxCG; ++k)

   {

     //  c  =  | r[k-1] |**2

     c = cp;


     //  a[k] := | r[k-1] |**2 / < p[k], Ap[k] > ;

     //

     //  First compute  d  =  < p, A.p >

     //  Mp = M(u) * p


     A(Ap, p, PLUS);


     //  d = | mp | ** 2

     d = innerProductReal(p, Ap, s);     /* 2 Nc Ns  flops */


     a = Real(c)/Real(d);


     //  Psi[k] += a[k] p[k]

     for(int n=0; n < N; ++n) {

       psi[n][s] += a * p[n];    /* 2 Nc Ns  flops */

     }


     //  r[k] -= a[k] A . p[k] ;

     //

     for(int n=0; n < N; ++n) {

       r[n][s] -= a * Ap[n];

     }


 #ifdef PRINT_5D_RESID

     for(int n=0; n < N; n++) {

       Double norm_r = norm2(r[n],s);

       if( toBool( norm_r > Double(1.0e-20)) )

         QDPIO::cout << "Iteration " << k << " r[" << n << "] = " << norm_r << std::endl;

     }

 #endif


     //  IF |r[k]| <= RsdCG |Chi| THEN RETURN;


     //  cp  =  | r[k] |**2

     cp = norm2(r, s);                   /* 2 Nc Ns  flops */


     QDPIO::cout << "InvCG: k = " << k << "  cp = " << cp << std::endl;


     if ( toBool(cp  <=  rsd_sq) )

     {

       n_count = k;

       revertFromFastMemoryHint(psi,true);

       END_CODE();

       return;

     }


     //  b[k+1] := |r[k]|**2 / |r[k-1]|**2

     b = Real(cp) / Real(c);

 #if 1

     QDPIO::cout << "InvCGev: k = " << k << "  alpha = " << a << "  beta = " << b << std::endl;

 #endif


     //  p[k+1] := r[k] + b[k+1] p[k]

     for(int n=0; n < N; ++n)

       p[n][s] = r[n] + b*p[n];  /* Nc Ns  flops */

   }

   n_count = MaxCG;

   QDPIO::cerr << "Nonconvergence Warning" << std::endl;

   revertFromFastMemoryHint(psi,true);

   END_CODE();

   return;


 }


 // Fix here for now

 template<>

 void InvCG1(const LinearOperatorArray<LatticeFermion>& A,

             const multi1d<LatticeFermion>& chi,

             multi1d<LatticeFermion>& psi,

             const Real& RsdCG,

             int MaxCG,

             int& n_count)

 {

   InvCG1_a(A, chi, psi, RsdCG, MaxCG, n_count);

 }


 }  // end namespace Chroma

chromabase.h
Primary include file for CHROMA library code.

END_CODE
#define END_CODE()
Definition: chromabase.h:65

START_CODE
#define START_CODE()
Definition: chromabase.h:64

Chroma::LinearOperatorArray
Linear Operator to arrays.
Definition: linearop.h:61

MaxCG
EXTERN int MaxCG
Definition: common_declarations.h:15

Chroma::InvCG1
void InvCG1(const LinearOperatorArray< LatticeFermion > &A, const multi1d< LatticeFermion > &chi, multi1d< LatticeFermion > &psi, const Real &RsdCG, int MaxCG, int &n_count)
Conjugate-Gradient (CGNE) algorithm for a generic Linear Operator.
Definition: invcg1_array.cc:216

Chroma::InvCG1_a
void InvCG1_a(const LinearOperatorArray< T > &A, const multi1d< T > &chi, multi1d< T > &psi, const Real &RsdCG, int MaxCG, int &n_count)
Conjugate-Gradient (CGNE) algorithm for a generic Linear Operator.
Definition: invcg1_array.cc:67

invcg1_array.h
Conjugate-Gradient algorithm for a generic Linear Operator.

s
unsigned s
Definition: ldumul_w.cc:37

i
unsigned i
Definition: ldumul_w.cc:34

n
unsigned n
Definition: ldumul_w.cc:36

c
int c
Definition: meslate.cc:61

Chroma
Asqtad Staggered-Dirac operator.
Definition: klein_gord.cc:10

Chroma::RsdCG
const WilsonTypeFermAct< multi1d< LatticeFermion > > Handle< const ConnectState > const multi1d< Real > enum InvType invType const multi1d< Real > & RsdCG
Definition: pbg5p_w.cc:30

Chroma::p
p
Definition: invbicg.cc:157

Chroma::rsd_sq
Real rsd_sq
Definition: invbicg.cc:121

Chroma::PLUS
@ PLUS
Definition: chromabase.h:45

Chroma::cp
Double cp
Definition: invbicg.cc:107

Chroma::a
Complex a
Definition: invbicg.cc:95

Chroma::d
DComplex d
Definition: invbicg.cc:99

Chroma::A
A(A, psi, r, Ncb, PLUS)

Chroma::b
Complex b
Definition: invbicg.cc:96

Chroma::k
int k
Definition: invbicg.cc:119

testing::internal::Double
FloatingPoint< double > Double
Definition: gtest.h:7351

r
multi1d< LatticeFermion > r(Ncb)

chi
chi
Definition: pade_trln_w.cc:24

psi
psi
Definition: pade_trln_w.cc:191

n_count
int n_count
Definition: pade_trln_w.cc:69