www/dox/inv__eigcg2_8cc_source.html

 // -*- C++ -*-

 /*! \file

  *  \brief Conjugate-Gradient algorithm with eigenstd::vector acceleration

  */


 #include <qdp-lapack.h>

 //#include "octave_debug.h"

 //#include "octave_debug.cc"


 #include "actions/ferm/invert/inv_eigcg2.h"


 #include "actions/ferm/invert/containers.h"

 #include "actions/ferm/invert/norm_gram_schm.h"


 //#define DEBUG

 #define DEBUG_FINAL


 // NEEDS A LOT OF CLEAN UP

 namespace Chroma

 {

   using namespace LinAlg ;

   //using namespace Octave ;


   namespace InvEigCG2Env

   {

     // needs a little clean up... for possible exceptions if the size of H

     // is smaller than hind

     // LatticeFermionF

     template<typename T>

     void SubSpaceMatrix_T(LinAlg::Matrix<DComplex>& H,

                           const LinearOperator<T>& A,

                           const multi1d<T>& evec,

                           int Nvecs)

     {

       H.N = Nvecs ;

       if(Nvecs>evec.size()){

         H.N = evec.size();

       }

       if(H.N>H.size()){

         QDPIO::cerr<<"OOPS! your matrix can't take this many matrix elements\n";

         exit(1);

       }

       // fill H  with zeros

       H.mat = 0.0 ;


       T Ap;

       for(int i(0);i<H.N;i++)

       {

         A(Ap,evec[i],PLUS) ;

         for(int j(i);j<H.N;j++)

         {

           H(j,i) = innerProduct(evec[j], Ap, A.subset()) ;

           //enforce hermiticity

           H(i,j) = conj(H(j,i));

           if(i==j) H(i,j) = real(H(i,j));

         }

       }

     }


     template<typename T>

     void SubSpaceMatrix_T(LinAlg::Matrix<DComplex>& H,

                           const LinearOperator<T>& A,

                           const multi1d<T>& evec,

                           const multi1d<Double>& eval,

                           int Nvecs,int NgoodEvecs)

     {

       H.N = Nvecs ;

       if(Nvecs>evec.size()){

         H.N = evec.size();

       }

       if(H.N>H.size()){

         QDPIO::cerr<<"OOPS! your matrix can't take this many matrix elements\n";

         exit(1);

       }

       // fill H  with zeros

       H.mat = 0.0 ;


       for(int i(0);i<NgoodEvecs;i++)

         H(i,i) = eval(i);


       T Ap;

       for(int i(NgoodEvecs);i<H.N;i++)

       {

         A(Ap,evec[i],PLUS) ;

         for(int j(0);j<H.N;j++)

         {

           H(j,i) = innerProduct(evec[j], Ap, A.subset()) ;

           //enforce hermiticity

           H(i,j) = conj(H(j,i));

           if(i==j) H(i,j) = real(H(i,j));

         }

       }

     }


     //The new code

     template<typename T>

     SystemSolverResults_t new_InvEigCG2_T(const LinearOperator<T>& A,

                                           T& x,

                                           const T& b,

                                           multi1d<Double>& eval,

                                           multi1d<T>& evec,

                                           int Neig,

                                           int Nmax,

                                           const Real& RsdCG, int MaxCG,

                                           const int PrintLevel)

     {

       START_CODE();


       FlopCounter flopcount;

       flopcount.reset();

       StopWatch swatch;

       swatch.reset();

       swatch.start();


       SystemSolverResults_t  res;


       T p ;

       T Ap;

       T r ;

       //T z ;


       Double rsd_sq = (RsdCG * RsdCG) * Real(norm2(b,A.subset()));

       Double alphaprev, alpha,pAp;

       Real beta;

       Double betaprev  ;

       Double r_dot_z, r_dot_z_old ;


       int k = 0 ;

       A(Ap,x,PLUS) ;

       r[A.subset()] = b - Ap ;

       r_dot_z = norm2(r,A.subset()) ;


 #if 1

       QDPIO::cout << "InvEigCG2: Nevecs(input) = " << evec.size() << std::endl;

       QDPIO::cout << "InvEigCG2: k = " << k << "  res^2 = " << r_dot_z << std::endl;

 #endif

       Matrix<DComplex> H(Nmax) ; // square matrix containing the tridiagonal

       Vectors<T> vec(Nmax) ; // contains the vectors we use...


       beta=0.0;

       alpha = 1.0;

       T Ap_prev ;

       T tt ;


       // Algorithm from page 529 of Golub and Van Loan

       // Modified to match the m-code from A. Stathopoulos

       while(toBool(r_dot_z>rsd_sq)){

         /** preconditioning algorithm **/

         //z[A.subset()]=r ; //preconditioning can be added here

         //r_dot_z = innerProductReal(r,z,A.subset());

         //****//

         r_dot_z_old = r_dot_z ;

         r_dot_z = norm2(r,A.subset());

         Double inv_sqrt_r_dot_z = 1.0/sqrt(r_dot_z) ;

         k++ ;

         if(k==1){

           //p[A.subset()] = z ;

           p[A.subset()] = r ;

         }

         else{

           betaprev = beta ;

           beta = r_dot_z/r_dot_z_old ;

           //p[A.subset()] = z + beta*p ;

           p[A.subset()] = r + beta*p ;

         }

         //-------- Eigenvalue eigenstd::vector finding code ------

         if((Neig>0)&& (H.N == Nmax)) Ap_prev[A.subset()]=Ap ;

         //---------------------------------------------------

         A(Ap,p,PLUS) ;


         //-------- Eigenvalue eigenstd::vector finding code ------

         if(Neig>0){

           if(k>1)

             H(H.N-1,H.N-1) = 1/alpha + betaprev/alphaprev;

           if(vec.N==Nmax){

             QDPIO::cout<<"MAGIC BEGINS: H.N ="<<H.N<<std::endl ;

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"H"<<k ;

               OctavePrintOut(H.mat,Nmax,tag.str(),"Hmatrix.m");

             }

             {

               Matrix<DComplex> tmp(Nmax) ;

               SubSpaceMatrix(tmp,A,vec.vec,vec.N);

               std::stringstream tag ;

               tag<<"H"<<k<<"ex" ;

               OctavePrintOut(tmp.mat,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif

             multi2d<DComplex> Hevecs(H.mat) ;

             multi1d<Double> Heval ;

             char V = 'V' ; char U = 'U' ;

             QDPLapack::zheev(V,U,Nmax,Hevecs,Heval);

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"Hevecs"<<k ;

               OctavePrintOut(Hevecs,Nmax,tag.str(),"Hmatrix.m");

             }

             for(int i(0);i<Nmax;i++)

               QDPIO::cout<<" eignvalue: "<<Heval[i]<<std::endl ;

 #endif

 #endif

             multi2d<DComplex> Hevecs_old(H.mat) ;

             multi1d<Double> Heval_old ;

             QDPLapack::zheev(V,U,Nmax-1,Hevecs_old,Heval_old);

             for(int i(0);i<Nmax;i++)

               Hevecs_old(i,Nmax-1) = Hevecs_old(Nmax-1,i) = 0.0 ;


             //Reduce to 2*Neig vectors

             H.N = Neig + Neig ; // Thickness of restart 2*Neig


             for(int i(Neig);i<2*Neig;i++)

               for(int j(0);j<Nmax;j++)

                 Hevecs(i,j) = Hevecs_old(i-Neig,j) ;


             // Orthogonalize the last Neig vecs (keep the first Neig fixed)

             // zgeqrf(Nmax, 2*Neig, Hevecs, Nmax,

             //  TAU_CMPLX_ofsize_2Neig, Workarr, 2*Neig*Lapackblocksize, info);

             multi1d<DComplex> TAU ;

             QDPLapack::zgeqrf(Nmax,2*Neig,Hevecs,TAU) ;

             char R = 'R' ; char L = 'L' ; char N ='N' ; char C = 'C' ;

             multi2d<DComplex> Htmp = H.mat ;

             QDPLapack::zunmqr(R,N,Nmax,Nmax,Hevecs,TAU,Htmp);

             QDPLapack::zunmqr(L,C,Nmax,2*Neig,Hevecs,TAU,Htmp);


             QDPLapack::zheev(V,U,2*Neig,Htmp,Heval);

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"Htmp"<<k ;

               OctavePrintOut(Htmp,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif

             for(int i(Neig); i< 2*Neig;i++ ) // mhpws prepei na einai 0..2*Neig

               for(int j(2*Neig); j<Nmax; j++)

                 Htmp(i,j) =0.0;


 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"HtmpBeforeZUM"<<k ;

               OctavePrintOut(Htmp,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif

             QDPLapack::zunmqr(L,N,Nmax,2*Neig,Hevecs,TAU,Htmp);

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"HtmpAfeterZUM"<<k ;

               OctavePrintOut(Htmp,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif


 #ifndef USE_BLAS_FOR_LATTICEFERMIONS

             multi1d<T> tt_vec(2*Neig);

             for(int i(0);i<2*Neig;i++){

               tt_vec[i][A.subset()] = zero ;

               for(int j(0);j<Nmax;j++)

                 tt_vec[i][A.subset()] +=Htmp(i,j)*vec[j] ;

             }

             for(int i(0);i<2*Neig;i++)

               vec[i][A.subset()] = tt_vec[i] ;

 #else

             // Here I need the restart_X bit

             // zgemm("N", "N", Ns*Nc*Vol/2, 2*Neig, Nmax, 1.0,

             //      vec.vec, Ns*Nc*Vol, Htmp, Nmax+1, 0.0, tt_vec, Ns*Nc*Vol);

             // copy apo tt_vec se vec.vec


 #endif

             vec.N = 2*Neig ; // restart the vectors to keep


             H.mat = 0.0 ; // zero out H

             for (int i=0;i<2*Neig;i++) H(i,i) = Heval[i];


             //A(tt,r,PLUS) ;

             tt[A.subset()] = Ap - beta*Ap_prev ; //avoid the matvec


 #ifndef USE_BLAS_FOR_LATTICEFERMIONS

             for (int i=0;i<2*Neig;i++){

               H(2*Neig,i)=innerProduct(vec[i],tt,A.subset())*inv_sqrt_r_dot_z ;

               H(i,2*Neig)=conj(H(2*Neig,i)) ;

             //H(i,2*Neig)=innerProduct(vec[i],tt,A.subset())*inv_sqrt_r_dot_z ;

             //H(2*Neig,i)=conj(H(i,2*Neig)) ;

             }

 #else

             // Optimized code for creating the H matrix row and column

             // asume even-odd layout: Can I check if this is the case at

             // compile time? or even at run time? This is a good test to

             // have to avoid wrong results.


 #endif

           }//H.N==Nmax

           else{

             if(k>1)

               H(H.N-1,H.N) = H(H.N,H.N-1) = -sqrt(beta)/alpha;

           }

           H.N++ ;

           //vec.NormalizeAndAddVector(z,inv_sqrt_r_dot_z,A.subset()) ;

           vec.NormalizeAndAddVector(r,inv_sqrt_r_dot_z,A.subset()) ;

         }


         pAp = innerProductReal(p,Ap,A.subset());

         alphaprev = alpha ;// additional line for Eigenvalue eigenstd::vector code

         alpha = r_dot_z/pAp ;

         x[A.subset()] += alpha*p ;

         r[A.subset()] -= alpha*Ap ;


         //---------------------------------------------------

         if(k>MaxCG){

           res.n_count = k;

           res.resid   = sqrt(r_dot_z);

           QDP_error_exit("too many CG iterations: count = %d", res.n_count);

           END_CODE();

           return res;

         }

 #if 1

         QDPIO::cout << "InvEigCG2: k = " << k  ;

         QDPIO::cout << "  r_dot_z = " << r_dot_z << std::endl;

 #endif

       }//end CG loop


       if(Neig>0){

         evec.resize(Neig) ;

         eval.resize(Neig);


 #define  USE_LAST_VECTORS

 #ifdef USE_LAST_VECTORS


         multi2d<DComplex> Hevecs(H.mat) ;

         multi1d<Double> Heval ;

         char V = 'V' ; char U = 'U' ;

         QDPLapack::zheev(V,U,H.N-1,Hevecs,Heval);


         for(int i(0);i<Neig;i++){

           evec[i][A.subset()] = zero ;

           eval[i] = Heval[i] ;

           for(int j(0);j<H.N-1;j++)

             evec[i][A.subset()] +=Hevecs(i,j)*vec[j] ;

         }

 #else

         for(int i(0);i<Neig;i++){

           evec[i][A.subset()] = vec[i] ;

           eval[i] = real(H(i,i)) ;

         }

 #endif

       }

       res.n_count = k ;

       res.resid = sqrt(r_dot_z);

       swatch.stop();

       QDPIO::cout << "InvEigCG2: k = " << k << std::endl;

       flopcount.report("InvEigCG2", swatch.getTimeInSeconds());

       END_CODE();

       return res;

     }


     template<typename T>

     SystemSolverResults_t InvEigCG2_T(const LinearOperator<T>& A,

                                       T& x,

                                       const T& b,

                                       multi1d<Double>& eval,

                                       multi1d<T>& evec,

                                       int Neig,

                                       int Nmax,

                                       const Real& RsdCG, int MaxCG,

                                       const int PrintLevel)

     {

       START_CODE();


       char V = 'V' ; char U = 'U' ;


       FlopCounter flopcount;

       flopcount.reset();

       StopWatch swatch;

       swatch.reset();

       swatch.start();


       SystemSolverResults_t  res;


       T p ;

       T Ap;

       T r,z ;


       Double rsd_sq = (RsdCG * RsdCG) * Real(norm2(b,A.subset()));

       Double alphaprev, alpha,pAp;

       Real beta ;

       Double r_dot_z, r_dot_z_old ;

       //Complex r_dot_z, r_dot_z_old,beta ;

       //Complex alpha,pAp ;


       int k = 0 ;

       A(Ap,x,PLUS) ;

       r[A.subset()] = b - Ap ;

       Double r_norm2 = norm2(r,A.subset()) ;


       if(PrintLevel>0)

         QDPIO::cout << "InvEigCG2: Nevecs(input) = " << evec.size() << std::endl;

       if(PrintLevel>1)

         QDPIO::cout << "InvEigCG2: k = " << k << "  res^2 = "<<r_norm2<<std::endl;


       Real inorm(Real(1.0/sqrt(r_norm2)));

       bool FindEvals = (Neig>0);

       int tr; // Don't know what this does...

       bool from_restart;

       Matrix<DComplex> H(Nmax) ; // square matrix containing the tridiagonal

       Vectors<T> vec(Nmax) ; // contains the vectors we use...

       //-------- Eigenvalue eigenstd::vector finding code ------

       vec.AddVectors(evec,A.subset()) ;

       //QDPIO::cout<<"vec.N="<<vec.N<<std::endl ;

       p[A.subset()] = inorm*r ; // this is not needed GramSchmidt will take care of it

       vec.AddOrReplaceVector(p,A.subset());

       //QDPIO::cout<<"vec.N="<<vec.N<<std::endl ;

       normGramSchmidt(vec.vec,vec.N-1,vec.N,A.subset());

       normGramSchmidt(vec.vec,vec.N-1,vec.N,A.subset()); //call twice: need to improve...

       SubSpaceMatrix(H,A,vec.vec,vec.N);

       from_restart = true ;

       tr = H.N - 1; // this is just a flag as far as I can tell

       //-------


       Double betaprev ;

       beta=0.0;

       alpha = 1.0;

       // Algorithm from page 529 of Golub and Van Loan

       // Modified to match the m-code from A. Stathopoulos

       while(toBool(r_norm2>rsd_sq)){

         /** preconditioning algorithm **

         z[A.subset()]=r ; //preconditioning can be added here

         r_dot_z = innerProductReal(r,z,A.subset());

         **/

         r_dot_z = innerProductReal(r,r,A.subset());

         k++ ;

         betaprev = beta; // additional line for Eigenvalue eigenstd::vector code

         if(k==1){

           //p[A.subset()] = z ;

           p[A.subset()] = r ;

           H.N++ ;

         }

         else{

           beta = r_dot_z/r_dot_z_old ;

           //p[A.subset()] = z + beta*p ;

           p[A.subset()] = r + beta*p ;

           //-------- Eigenvalue eigenstd::vector finding code ------

           // fist block

           if(FindEvals){

             if(!((from_restart)&&(H.N == tr+1))){

               if(!from_restart){

                 H(H.N-2,H.N-2) = 1/alpha + betaprev/alphaprev;

               }

               from_restart = false ;

               H(H.N-1,H.N-2) = -sqrt(beta)/alpha;

               H(H.N-2,H.N-1) = -sqrt(beta)/alpha;

             }

             H.N++ ;

           }

           //---------------------------------------------------

         }

         A(Ap,p,PLUS) ;

         pAp = innerProductReal(p,Ap,A.subset());


         alphaprev = alpha ;// additional line for Eigenvalue eigenstd::vector code

         alpha = r_dot_z/pAp ;

         x[A.subset()] += alpha*p ;

         r[A.subset()] -= alpha*Ap ;

         r_norm2 =  norm2(r,A.subset()) ;

         r_dot_z_old = r_dot_z ;


         //-------- Eigenvalue eigenstd::vector finding code ------

         // second block

         if(FindEvals){

           if (vec.N==Nmax){//we already have stored the maximum number of vectors

             // The magic begins here....

             if(PrintLevel>0)

               QDPIO::cout<<"MAGIC BEGINS: H.N ="<<H.N<<std::endl ;

             H(Nmax-1,Nmax-1) = 1/alpha + beta/alphaprev;


             multi2d<DComplex> Hevecs(H.mat) ;

             multi1d<Double> Heval ;

             QDPLapack::zheev(V,U,Hevecs,Heval);

             multi2d<DComplex> Hevecs_old(H.mat) ;


             multi1d<Double> Heval_old ;

             QDPLapack::zheev(V,U,Nmax-1,Hevecs_old,Heval_old);

             for(int i(0);i<Nmax;i++)


             tr = Neig + Neig ; // v_old = Neig optimal choice


             for(int i(Neig);i<tr;i++)

               for(int j(0);j<Nmax;j++)

                 Hevecs(i,j) = Hevecs_old(i-Neig,j) ;


             // Orthogonalize the last Neig vecs (keep the first Neig fixed)

             // zgeqrf(Nmax, 2*Neig, Hevecs, Nmax,

             //  TAU_CMPLX_ofsize_2Neig, Workarr, 2*Neig*Lapackblocksize, info);

             multi1d<DComplex> TAU ;

             QDPLapack::zgeqrf(Nmax,2*Neig,Hevecs,TAU) ;

             char R = 'R' ; char L = 'L' ; char N ='N' ; char C = 'C' ;

             multi2d<DComplex> Htmp = H.mat ;

             QDPLapack::zunmqr(R,N,Nmax,Nmax,Hevecs,TAU,Htmp);

             QDPLapack::zunmqr(L,C,Nmax,2*Neig,Hevecs,TAU,Htmp);

             // Notice that now H is of size 2Neig x 2Neig,

             // but still with LDA = Nmax


             QDPLapack::zheev(V,U,2*Neig,Htmp,Heval);

             for(int i(Neig); i< 2*Neig;i++ )

               for(int j(2*Neig); j<Nmax; j++)

                 Htmp(i,j) =0.0;


             QDPLapack::zunmqr(L,N,Nmax,2*Neig,Hevecs,TAU,Htmp);


             // Here I need the restart_X bit

             multi1d<T> tt_vec = vec.vec;

             for(int i(0);i<2*Neig;i++){

               vec[i][A.subset()] = zero ;

               for(int j(0);j<Nmax;j++)

                 vec[i][A.subset()] +=Htmp(i,j)*tt_vec[j] ; // NEED TO CHECK THE INDEXING

             }


             H.mat = 0.0 ; // zero out H

             for (int i=0;i<2*Neig;i++) H(i,i) = Heval[i];


             T Ar ;

             // Need to reorganize so that we aboid this extra matvec

             A(Ar,r,PLUS) ;

             Ar /= sqrt(r_norm2);

             // this has the oposite convension than the subspace matrix

             // this is the reason the std::vector reconstruction in here does not

             // need the conj(H) while in the Rayleigh Ritz refinement

             // it does need it.

             // In here the only complex matrix elements are these computined

             // in the next few lines. This is why the inconsistency

             //  does not matter anywhere else.

             // In the refinement step though all matrix elements are complex

             // hence things break down.

             // Need to fix the convension so that we do not

             // have these inconsistencies.

             for (int i=0;i<2*Neig;i++){

               H(2*Neig,i) = innerProduct(vec[i], Ar, A.subset()) ;

               H(i,2*Neig) = conj(H(2*Neig,i)) ;

             }

             H(2*Neig,2*Neig) = innerProduct(r, Ar, A.subset())/sqrt(r_norm2) ;


             H.N = 2*Neig + 1  ; // why this ?

             from_restart = true ;

             vec.N = 2*Neig ; // only keep the lowest Neig. Is this correct???


           }

           // Here we add a std::vector in the list

           Double inorm = 1.0/sqrt(r_norm2) ;

           vec.NormalizeAndAddVector(r,inorm,A.subset()) ;

           // Shouldn't be the z std::vector when a preconditioner is used?

         }

         //---------------------------------------------------


         if(k>MaxCG){

           res.n_count = k;

           res.resid   = sqrt(r_norm2);

           QDP_error_exit("too many CG iterations: count = %d", res.n_count);

           END_CODE();

           return res;

         }

         if(PrintLevel>1){

           QDPIO::cout << "InvEigCG2: k = " << k << "  res^2 = " << r_norm2 ;

           QDPIO::cout << "  r_dot_z = " << r_dot_z << std::endl;

         }

       }

       res.n_count = k ;

       res.resid = sqrt(r_norm2);

       if(FindEvals)

       {

         // Evec Code ------ Before we return --------

         // vs is the current number of vectors stored

         // Neig is the number of eigenstd::vector we want to compute

         normGramSchmidt(vec.vec,0,2*Neig,A.subset());

         normGramSchmidt(vec.vec,0,2*Neig,A.subset());

         Matrix<DComplex> Htmp(2*Neig) ;

         SubSpaceMatrix(Htmp,A,vec.vec,2*Neig);


         //char V = 'V' ; char U = 'U' ;

         multi1d<Double> tt_eval ;

         QDPLapack::zheev(V,U,Htmp.mat,tt_eval);

         evec.resize(Neig) ;

         eval.resize(Neig);

         for(int i(0);i<Neig;i++){

           evec[i][A.subset()] = zero ;

           eval[i] = tt_eval[i] ;

           for(int j(0);j<2*Neig;j++)

             evec[i][A.subset()] += Htmp(i,j)*vec[j] ;

         }


         // I will do the checking of eigenstd::vector quality outside this routine

         // -------------------------------------------

         if(PrintLevel>3){

           // CHECK IF vec are eigenvectors...

           T Av ;

           for(int i(0);i<Neig;i++){

             A(Av,evec[i],PLUS) ;

             DComplex rq = innerProduct(evec[i],Av,A.subset());

             Av[A.subset()] -= eval[i]*evec[i] ;

             Double tt = sqrt(norm2(Av,A.subset()));

             QDPIO::cout<<"FINAL: error eigenstd::vector["<<i<<"] = "<<tt<<" " ;

             tt =  sqrt(norm2(evec[i],A.subset()));

             QDPIO::cout<<"--- rq ="<<real(rq)<<" ";

             QDPIO::cout<<"--- norm = "<<tt<<std::endl  ;

           }

         }

       }


       res.n_count = k;

       res.resid   = sqrt(r_norm2);

       swatch.stop();

       QDPIO::cout << "InvEigCG2: k = " << k << std::endl;

       flopcount.report("InvEigCG2", swatch.getTimeInSeconds());

       END_CODE();

       return res;

     }


 #if 0

     //The old code

     template<typename T>

     SystemSolverResults_t InvEigCG2_T(const LinearOperator<T>& A,

                                       T& x,

                                       const T& b,

                                       multi1d<Double>& eval,

                                       multi1d<T>& evec,

                                       int Neig,

                                       int Nmax,

                                       const Real& RsdCG, int MaxCG)

     {

       START_CODE();


       FlopCounter flopcount;

       flopcount.reset();

       StopWatch swatch;

       swatch.reset();

       swatch.start();


       SystemSolverResults_t  res;


       T p ;

       T Ap;

       T r,z ;


       Double rsd_sq = (RsdCG * RsdCG) * Real(norm2(b,A.subset()));

       Double alphaprev, alpha,pAp;

       Real beta ;

       Double r_dot_z, r_dot_z_old ;

       //Complex r_dot_z, r_dot_z_old,beta ;

       //Complex alpha,pAp ;


       int k = 0 ;

       A(Ap,x,PLUS) ;

       r[A.subset()] = b - Ap ;

       Double r_norm2 = norm2(r,A.subset()) ;


 #if 1

       QDPIO::cout << "InvEigCG2: Nevecs(input) = " << evec.size() << std::endl;

       QDPIO::cout << "InvEigCG2: k = " << k << "  res^2 = " << r_norm2 << std::endl;

 #endif

       Real inorm(Real(1.0/sqrt(r_norm2)));

       bool FindEvals = (Neig>0);

       int tr; // Don't know what this does...

       bool from_restart;

       Matrix<DComplex> H(Nmax) ; // square matrix containing the tridiagonal

       Vectors<T> vec(Nmax) ; // contains the vectors we use...

       //-------- Eigenvalue eigenstd::vector finding code ------

       vec.AddVectors(evec,A.subset()) ;

       //QDPIO::cout<<"vec.N="<<vec.N<<std::endl ;

       p[A.subset()] = inorm*r ; // this is not needed GramSchmidt will take care of it

       vec.AddOrReplaceVector(p,A.subset());

       //QDPIO::cout<<"vec.N="<<vec.N<<std::endl ;

       normGramSchmidt(vec.vec,vec.N-1,vec.N,A.subset());

       normGramSchmidt(vec.vec,vec.N-1,vec.N,A.subset()); //call twice: need to improve...

       SubSpaceMatrix(H,A,vec.vec,vec.N);

       from_restart = true ;

       tr = H.N - 1; // this is just a flag as far as I can tell

       //-------


       Double betaprev ;

       beta=0.0;

       alpha = 1.0;

       // Algorithm from page 529 of Golub and Van Loan

       // Modified to match the m-code from A. Stathopoulos

       while(toBool(r_norm2>rsd_sq)){

         /** preconditioning algorithm **/

         z[A.subset()]=r ; //preconditioning can be added here

         /**/

         r_dot_z = innerProductReal(r,z,A.subset());

         k++ ;

         betaprev = beta; // additional line for Eigenvalue eigenstd::vector code

         if(k==1){

           p[A.subset()] = z ;

           H.N++ ;

         }

         else{

           beta = r_dot_z/r_dot_z_old ;

           p[A.subset()] = z + beta*p ;

           //-------- Eigenvalue eigenstd::vector finding code ------

           // fist block

           if(FindEvals){

             if(!((from_restart)&&(H.N == tr+1))){

               if(!from_restart){

                 H(H.N-2,H.N-2) = 1/alpha + betaprev/alphaprev;

               }

               from_restart = false ;

               H(H.N-1,H.N-2) = -sqrt(beta)/alpha;

               H(H.N-2,H.N-1) = -sqrt(beta)/alpha;

             }

             H.N++ ;

           }

           //---------------------------------------------------

         }

         A(Ap,p,PLUS) ;

         pAp = innerProductReal(p,Ap,A.subset());


         alphaprev = alpha ;// additional line for Eigenvalue eigenstd::vector code

         alpha = r_dot_z/pAp ;

         x[A.subset()] += alpha*p ;

         r[A.subset()] -= alpha*Ap ;

         r_norm2 =  norm2(r,A.subset()) ;

         r_dot_z_old = r_dot_z ;


         //-------- Eigenvalue eigenstd::vector finding code ------

         // second block

         if(FindEvals){

           if (vec.N==Nmax){//we already have stored the maximum number of vectors

             // The magic begins here....

             QDPIO::cout<<"MAGIC BEGINS: H.N ="<<H.N<<std::endl ;

             H(Nmax-1,Nmax-1) = 1/alpha + beta/alphaprev;


 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"H"<<k ;

               OctavePrintOut(H.mat,Nmax,tag.str(),"Hmatrix.m");

             }

             {

               Matrix<DComplex> tmp(Nmax) ;

               SubSpaceMatrix(tmp,A,vec.vec,vec.N);

               std::stringstream tag ;

               tag<<"H"<<k<<"ex" ;

               OctavePrintOut(tmp.mat,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif

             //exit(1);

             multi2d<DComplex> Hevecs(H.mat) ;

             multi1d<Double> Heval ;

             char V = 'V' ; char U = 'U' ;

             QDPLapack::zheev(V,U,Hevecs,Heval);

             multi2d<DComplex> Hevecs_old(H.mat) ;


 #ifdef DEBUG

             {

               multi1d<T> tt_vec(vec.size());

               for(int i(0);i<Nmax;i++){

                 tt_vec[i][A.subset()] = zero ;

                 for(int j(0);j<Nmax;j++)

                   tt_vec[i][A.subset()] +=Hevecs(i,j)*vec[j] ; // NEED TO CHECK THE INDEXINT

               }

               // CHECK IF vec are eigenvectors...


               T Av ;

               for(int i(0);i<Nmax;i++){

                 A(Av,tt_vec[i],PLUS) ;

                 DComplex rq = innerProduct(tt_vec[i],Av,A.subset());

                 Av[A.subset()] -= Heval[i]*tt_vec[i] ;

                 Double tt = sqrt(norm2(Av,A.subset()));

                 QDPIO::cout<<"1 error eigenstd::vector["<<i<<"] = "<<tt<<" " ;

                 tt =  sqrt(norm2(tt_vec[i],A.subset()));

                 QDPIO::cout<<" --- eval = "<<Heval[i]<<" ";

                 QDPIO::cout<<" --- rq = "<<real(rq)<<" ";

                 QDPIO::cout<<"--- norm = "<<tt<<std::endl  ;

               }

             }

 #endif

             multi1d<Double> Heval_old ;

             QDPLapack::zheev(V,U,Nmax-1,Hevecs_old,Heval_old);

             for(int i(0);i<Nmax;i++)

               Hevecs_old(i,Nmax-1) = Hevecs_old(Nmax-1,i) = 0.0 ;

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"Hevecs_old"<<k ;

               OctavePrintOut(Hevecs_old,Nmax,tag.str(),"Hmatrix.m");

             }


 #endif

 #endif

             tr = Neig + Neig ; // v_old = Neig optimal choice


             for(int i(Neig);i<tr;i++)

               for(int j(0);j<Nmax;j++)

                 Hevecs(i,j) = Hevecs_old(i-Neig,j) ;

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"Hevecs"<<k ;

               OctavePrintOut(Hevecs,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif


             // Orthogonalize the last Neig vecs (keep the first Neig fixed)

             // zgeqrf(Nmax, 2*Neig, Hevecs, Nmax,

             //    TAU_CMPLX_ofsize_2Neig, Workarr, 2*Neig*Lapackblocksize, info);

             multi1d<DComplex> TAU ;

             QDPLapack::zgeqrf(Nmax,2*Neig,Hevecs,TAU) ;

             char R = 'R' ; char L = 'L' ; char N ='N' ; char C = 'C' ;

             multi2d<DComplex> Htmp = H.mat ;

             QDPLapack::zunmqr(R,N,Nmax,Nmax,Hevecs,TAU,Htmp);

             QDPLapack::zunmqr(L,C,Nmax,2*Neig,Hevecs,TAU,Htmp);

             // Notice that now H is of size 2Neig x 2Neig,

             // but still with LDA = Nmax

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"Htmp"<<k ;

               OctavePrintOut(Htmp,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif

             QDPLapack::zheev(V,U,2*Neig,Htmp,Heval);

             for(int i(Neig); i< 2*Neig;i++ )

               for(int j(2*Neig); j<Nmax; j++)

                 Htmp(i,j) =0.0;

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"evecstmp"<<k ;

               OctavePrintOut(Htmp,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif

             QDPLapack::zunmqr(L,N,Nmax,2*Neig,Hevecs,TAU,Htmp);

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"Yevecstmp"<<k ;

               OctavePrintOut(Htmp,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif

             // Here I need the restart_X bit

             multi1d<T> tt_vec = vec.vec;

             for(int i(0);i<2*Neig;i++){

               vec[i][A.subset()] = zero ;

               for(int j(0);j<Nmax;j++)

                 vec[i][A.subset()] +=Htmp(i,j)*tt_vec[j] ; // NEED TO CHECK THE INDEXING

             }


 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             // CHECK IF vec are eigenvectors...

             {

               T Av ;

               for(int i(0);i<2*Neig;i++){

                 A(Av,vec[i],PLUS) ;

                 DComplex rq = innerProduct(vec[i],Av,A.subset());

                 Av[A.subset()] -= Heval[i]*vec[i] ;

                 Double tt = sqrt(norm2(Av,A.subset()));

                 QDPIO::cout<<"error eigenstd::vector["<<i<<"] = "<<tt<<" " ;

                 tt =  sqrt(norm2(vec[i],A.subset()));

                 QDPIO::cout<<"--- rq ="<<real(rq)<<" ";

                 QDPIO::cout<<"--- norm = "<<tt<<std::endl  ;

               }


             }

 #endif

 #endif

             H.mat = 0.0 ; // zero out H

             for (int i=0;i<2*Neig;i++) H(i,i) = Heval[i];


             T Ar ;

             // Need to reorganize so that we aboid this extra matvec

             A(Ar,r,PLUS) ;

             Ar /= sqrt(r_norm2);

             // this has the oposite convension than the subspace matrix

             // this is the reason the std::vector reconstruction in here does not

             // need the conj(H) while in the Rayleigh Ritz refinement

             // it does need it.

             // In here the only complex matrix elements are these computined

             // in the next few lines. This is why the inconsistency

             //  does not matter anywhere else.

             // In the refinement step though all matrix elements are complex

             // hence things break down.

             // Need to fix the convension so that we do not

             // have these inconsistencies.

             for (int i=0;i<2*Neig;i++){

               H(2*Neig,i) = innerProduct(vec[i], Ar, A.subset()) ;

               H(i,2*Neig) = conj(H(2*Neig,i)) ;

             }

             H(2*Neig,2*Neig) = innerProduct(r, Ar, A.subset())/sqrt(r_norm2) ;


             H.N = 2*Neig + 1  ; // why this ?

             from_restart = true ;

             vec.N = 2*Neig ; // only keep the lowest Neig. Is this correct???

 #ifdef DEBUG

 #ifndef QDP_IS_QDPJIT

             {

               std::stringstream tag ;

               tag<<"finalH"<<k ;

               OctavePrintOut(H.mat,Nmax,tag.str(),"Hmatrix.m");

             }

 #endif

 #endif

           }

           // Here we add a std::vector in the list

           Double inorm = 1.0/sqrt(r_norm2) ;

           vec.NormalizeAndAddVector(r,inorm,A.subset()) ;

           // Shouldn't be the z std::vector when a preconditioner is used?

         }

         //---------------------------------------------------


         if(k>MaxCG){

           res.n_count = k;

           res.resid   = sqrt(r_norm2);

           QDP_error_exit("too many CG iterations: count = %d", res.n_count);

           END_CODE();

           return res;

         }

 #if 1

         QDPIO::cout << "InvEigCG2: k = " << k << "  res^2 = " << r_norm2 ;

         QDPIO::cout << "  r_dot_z = " << r_dot_z << std::endl;

 #endif

       }

       res.n_count = k ;

       res.resid = sqrt(r_norm2);

       if(FindEvals)

       {

         // Evec Code ------ Before we return --------

         // vs is the current number of vectors stored

         // Neig is the number of eigenstd::vector we want to compute

         normGramSchmidt(vec.vec,0,2*Neig,A.subset());

         normGramSchmidt(vec.vec,0,2*Neig,A.subset());

         Matrix<DComplex> Htmp(2*Neig) ;

         SubSpaceMatrix(Htmp,A,vec.vec,2*Neig);


         char V = 'V' ; char U = 'U' ;

         multi1d<Double> tt_eval ;

         QDPLapack::zheev(V,U,Htmp.mat,tt_eval);

         evec.resize(Neig) ;

         eval.resize(Neig);

         for(int i(0);i<Neig;i++){

           evec[i][A.subset()] = zero ;

           eval[i] = tt_eval[i] ;

           for(int j(0);j<2*Neig;j++)

             evec[i][A.subset()] += Htmp(i,j)*vec[j] ;

         }


         // I will do the checking of eigenstd::vector quality outside this routine

         // -------------------------------------------

 #ifdef DEBUG_FINAL

         // CHECK IF vec are eigenvectors...

         {

           T Av ;

           for(int i(0);i<Neig;i++)

           {

             A(Av,evec[i],PLUS) ;

             DComplex rq = innerProduct(evec[i],Av,A.subset());

             Av[A.subset()] -= eval[i]*evec[i] ;

             Double tt = sqrt(norm2(Av,A.subset()));

             QDPIO::cout<<"FINAL: error eigenstd::vector["<<i<<"] = "<<tt<<" " ;

             tt =  sqrt(norm2(evec[i],A.subset()));

             QDPIO::cout<<"--- rq ="<<real(rq)<<" ";

             QDPIO::cout<<"--- norm = "<<tt<<std::endl  ;

           }


         }

 #endif

       }


       res.n_count = k;

       res.resid   = sqrt(r_norm2);

       swatch.stop();

       QDPIO::cout << "InvEigCG2: k = " << k << std::endl;

       flopcount.report("InvEigCG2", swatch.getTimeInSeconds());

       END_CODE();

       return res;

     }


 #endif


     // A  should be Hermitian positive definite

     template<typename T>

     SystemSolverResults_t vecPrecondCG_T(const LinearOperator<T>& A,

                                          T& x,

                                          const T& b,

                                          const multi1d<Double>& eval,

                                          const multi1d<T>& evec,

                                          int startV, int endV,

                                          const Real& RsdCG, int MaxCG)

     {

       START_CODE();


       FlopCounter flopcount;

       flopcount.reset();

       StopWatch swatch;

       swatch.reset();

       swatch.start();


       if(endV>eval.size()){

         QDP_error_exit("vPrecondCG: not enought evecs eval.size()=%d",eval.size());

       }


       SystemSolverResults_t  res;


       T p ;

       T Ap;

       T r,z ;


       Double rsd_sq = (RsdCG * RsdCG) * Real(norm2(b,A.subset()));

       Double alpha,pAp;

       Real beta ;

       Double r_dot_z, r_dot_z_old ;

       //Complex r_dot_z, r_dot_z_old,beta ;

       //Complex alpha,pAp ;


       int k = 0 ;

       A(Ap,x,PLUS) ;

       r[A.subset()] = b - Ap ;

       Double r_norm2 = norm2(r,A.subset()) ;


 #if 1

       QDPIO::cout << "vecPrecondCG: k = " << k << "  res^2 = " << r_norm2 << std::endl;

 #endif


       // Algorithm from page 529 of Golub and Van Loan

       while(toBool(r_norm2>rsd_sq)){

         /** preconditioning algorithm **/

         z[A.subset()]=r ; // not optimal but do it for now...

         /**/

         for(int i(startV);i<endV;i++){

           DComplex d = innerProduct(evec[i],r,A.subset()) ;

           //QDPIO::cout<<"vecPrecondCG: "<< d<<" "<<(1.0/eval[i]-1.0)<<std::endl;

           z[A.subset()] += (1.0/eval[i]-1.0)*d*evec[i];

         }

         /**/

         /**/

         r_dot_z = innerProductReal(r,z,A.subset());

         k++ ;

         if(k==1){

           p[A.subset()] = z ;

         }

         else{

           beta = r_dot_z/r_dot_z_old ;

           p[A.subset()] = z + beta*p ;

         }

         //Cheb.Qsq(Ap,p) ;

         A(Ap,p,PLUS) ;

         pAp = innerProductReal(p,Ap,A.subset());


         alpha = r_dot_z/pAp ;

         x[A.subset()] += alpha*p ;

         r[A.subset()] -= alpha*Ap ;

         r_norm2 =  norm2(r,A.subset()) ;

         r_dot_z_old = r_dot_z ;


         if(k>MaxCG){

           res.n_count = k ;

           QDP_error_exit("too many CG iterations: count = %d", res.n_count);

           return res;

         }

 #if 1

         QDPIO::cout << "vecPrecondCG: k = " << k << "  res^2 = " << r_norm2 ;

         QDPIO::cout << "  r_dot_z = " << r_dot_z << std::endl;

 #endif

       }


       res.n_count = k ;

       res.resid   = sqrt(r_norm2);

       swatch.stop();

       QDPIO::cout << "vPreconfCG: k = " << k << std::endl;

       flopcount.report("vPrecondCG", swatch.getTimeInSeconds());

       END_CODE();

       return res ;

     }


     template<typename T>

     void InitGuess_T(const LinearOperator<T>& A,

                      T& x,

                      const T& b,

                      const multi1d<Double>& eval,

                      const multi1d<T>& evec,

                      int& n_count)

     {

       int N = evec.size();

       InitGuess(A,x,b,eval,evec,N,n_count);

     }


     template<typename T>

     void InitGuess_T(const LinearOperator<T>& A,

                      T& x,

                      const T& b,

                      const multi1d<Double>& eval,

                      const multi1d<T>& evec,

                      int N, // number of vectors to use

                      int& n_count)

     {

       T Ap;

       T r ;


       StopWatch snoop;

       //snoop.reset();

       //snoop.start();


       A(Ap,x,PLUS) ;

       r[A.subset()] = b - Ap ;

       // Double r_norm2 = norm2(r,A.subset()) ;


       for(int i(0);i<N;i++){

         DComplex d = innerProduct(evec[i],r,A.subset());

         x[A.subset()] += (d/eval[i])*evec[i];

         //QDPIO::cout<<"InitCG: "<<d<<" "<<eval[i]<<std::endl ;


       }


       //snoop.stop();

       /**

       QDPIO::cout << "InitGuess:  time = "

                   << snoop.getTimeInSeconds()

                   << " secs" << std::endl;

       **/

       n_count = 1 ;

     }


     //

     // Wrappers

     //

     // LatticeFermionF

     void SubSpaceMatrix(LinAlg::Matrix<DComplex>& H,

                         const LinearOperator<LatticeFermionF>& A,

                         const multi1d<LatticeFermionF>& evec,

                         int Nvecs)

     {

       SubSpaceMatrix_T<LatticeFermionF>(H, A, evec, Nvecs);

     }


     void SubSpaceMatrix(LinAlg::Matrix<DComplex>& H,

                         const LinearOperator<LatticeFermionF>& A,

                         const multi1d<LatticeFermionF>& evec,

                         const multi1d<Double>& eval,

                         int Nvecs,int NgoodEvecs){

       SubSpaceMatrix_T<LatticeFermionF>(H, A, evec, eval, Nvecs, NgoodEvecs) ;

     }


     SystemSolverResults_t InvEigCG2(const LinearOperator<LatticeFermionF>& A,

                                     LatticeFermionF& x,

                                     const LatticeFermionF& b,

                                     multi1d<Double>& eval,

                                     multi1d<LatticeFermionF>& evec,

                                     int Neig,

                                     int Nmax,

                                     const Real& RsdCG, int MaxCG,

                                     const int PrintLevel)

     {

       return InvEigCG2_T<LatticeFermionF>(A, x, b, eval, evec, Neig, Nmax, RsdCG, MaxCG, PrintLevel);

     }


     SystemSolverResults_t vecPrecondCG(const LinearOperator<LatticeFermionF>& A,

                                        LatticeFermionF& x,

                                        const LatticeFermionF& b,

                                        const multi1d<Double>& eval,

                                        const multi1d<LatticeFermionF>& evec,

                                        int startV, int endV,

                                        const Real& RsdCG, int MaxCG)

     {

       return vecPrecondCG_T<LatticeFermionF>(A, x, b, eval, evec, startV, endV, RsdCG, MaxCG);

     }


     void InitGuess(const LinearOperator<LatticeFermionF>& A,

                    LatticeFermionF& x,

                    const LatticeFermionF& b,

                    const multi1d<Double>& eval,

                    const multi1d<LatticeFermionF>& evec,

                    int& n_count)

     {

       InitGuess_T(A, x, b, eval, evec, n_count);

     }


     void InitGuess(const LinearOperator<LatticeFermionF>& A,

                    LatticeFermionF& x,

                    const LatticeFermionF& b,

                    const multi1d<Double>& eval,

                    const multi1d<LatticeFermionF>& evec,

                    int N, // number of vectors to use

                    int& n_count)

     {

       InitGuess_T(A, x, b, eval, evec, N, n_count);

     }


     // LatticeFermionD

     void SubSpaceMatrix(LinAlg::Matrix<DComplex>& H,

                         const LinearOperator<LatticeFermionD>& A,

                         const multi1d<LatticeFermionD>& evec,

                         int Nvecs)

     {

       SubSpaceMatrix_T<LatticeFermionD>(H, A, evec, Nvecs);

     }


     void SubSpaceMatrix(LinAlg::Matrix<DComplex>& H,

                         const LinearOperator<LatticeFermionD>& A,

                         const multi1d<LatticeFermionD>& evec,

                         const multi1d<Double>& eval,

                         int Nvecs,int NgoodEvecs){

       SubSpaceMatrix_T<LatticeFermionD>(H, A, evec, eval, Nvecs, NgoodEvecs) ;

     }


     SystemSolverResults_t InvEigCG2(const LinearOperator<LatticeFermionD>& A,

                                     LatticeFermionD& x,

                                     const LatticeFermionD& b,

                                     multi1d<Double>& eval,

                                     multi1d<LatticeFermionD>& evec,

                                     int Neig,

                                     int Nmax,

                                     const Real& RsdCG, int MaxCG,

                                     const int plvl)

     {

       return InvEigCG2_T<LatticeFermionD>(A, x, b, eval, evec, Neig, Nmax, RsdCG, MaxCG,plvl);

     }


     SystemSolverResults_t vecPrecondCG(const LinearOperator<LatticeFermionD>& A,

                                        LatticeFermionD& x,

                                        const LatticeFermionD& b,

                                        const multi1d<Double>& eval,

                                        const multi1d<LatticeFermionD>& evec,

                                        int startV, int endV,

                                        const Real& RsdCG, int MaxCG)

     {

       return vecPrecondCG_T<LatticeFermionD>(A, x, b, eval, evec, startV, endV, RsdCG, MaxCG);

     }


     void InitGuess(const LinearOperator<LatticeFermionD>& A,

                    LatticeFermionD& x,

                    const LatticeFermionD& b,

                    const multi1d<Double>& eval,

                    const multi1d<LatticeFermionD>& evec,

                    int& n_count)

     {

       InitGuess_T(A, x, b, eval, evec, n_count);

     }


     void InitGuess(const LinearOperator<LatticeFermionD>& A,

                    LatticeFermionD& x,

                    const LatticeFermionD& b,

                    const multi1d<Double>& eval,

                    const multi1d<LatticeFermionD>& evec,

                    int N, // number of vectors to use

                    int& n_count)

     {

       InitGuess_T(A, x, b, eval, evec, N, n_count);

     }

   } // namespace InvEigCG2Env


 }// End Namespace Chroma


Chroma::LinAlg::Matrix
This is a square matrix.
Definition: containers.h:328

Chroma::LinAlg::Matrix::N
int N
Definition: containers.h:331

Chroma::LinAlg::Matrix::size
int size() const
Definition: containers.h:345

Chroma::LinAlg::Matrix::mat
multi2d< T > mat
Definition: containers.h:330

Chroma::LinAlg::Vectors
Hold vectors.
Definition: containers.h:160

Chroma::LinAlg::Vectors::AddVectors
void AddVectors(multi1d< T > &v, const Subset &s)
Definition: containers.h:204

Chroma::LinAlg::Vectors::AddOrReplaceVector
void AddOrReplaceVector(const T &v, const Subset &s)
Definition: containers.h:193

Chroma::LinAlg::Vectors::N
int N
Definition: containers.h:163

Chroma::LinAlg::Vectors::NormalizeAndAddVector
void NormalizeAndAddVector(const T &v, const Double &inorm, const Subset &s)
Definition: containers.h:185

Chroma::LinAlg::Vectors::vec
multi1d< T > vec
Definition: containers.h:162

Chroma::LinearOperator
Linear Operator.
Definition: linearop.h:27

containers.h

Chroma::normGramSchmidt
void normGramSchmidt(multi1d< LatticeFermionF > &vec, int f, int t, const Subset &sub)
Gram-Schmidt with normalization.
Definition: norm_gram_schm.cc:80

inv_eigcg2.h
Conjugate-Gradient algorithm with eigenstd::vector acceleration.

j
unsigned j
Definition: ldumul_w.cc:35

z
int z
Definition: meslate.cc:36

x
int x
Definition: meslate.cc:34

Chroma::BaryonSpinMats::C
SpinMatrix C()
C = Gamma(10)
Definition: barspinmat_w.cc:29

Chroma::InlinePropAndMatElemDistillation2Env::local::innerProduct
BinaryReturn< C1, C2, FnInnerProduct >::Type_t innerProduct(const QDPSubType< T1, C1 > &s1, const QDPType< T2, C2 > &s2)
Definition: inline_prop_and_matelem_distillation2_w.cc:463

Chroma::InvEigCG2Env::vecPrecondCG
SystemSolverResults_t vecPrecondCG(const LinearOperator< LatticeFermionD > &A, LatticeFermionD &x, const LatticeFermionD &b, const multi1d< Double > &eval, const multi1d< LatticeFermionD > &evec, int startV, int endV, const Real &RsdCG, int MaxCG)
Definition: inv_eigcg2.cc:1249

Chroma::InvEigCG2Env::InitGuess
void InitGuess(const LinearOperator< LatticeFermionD > &A, LatticeFermionD &x, const LatticeFermionD &b, const multi1d< Double > &eval, const multi1d< LatticeFermionD > &evec, int N, int &n_count)
Definition: inv_eigcg2.cc:1270

Chroma::InvEigCG2Env::new_InvEigCG2_T
SystemSolverResults_t new_InvEigCG2_T(const LinearOperator< T > &A, T &x, const T &b, multi1d< Double > &eval, multi1d< T > &evec, int Neig, int Nmax, const Real &RsdCG, int MaxCG, const int PrintLevel)
Definition: inv_eigcg2.cc:98

Chroma::InvEigCG2Env::SubSpaceMatrix
void SubSpaceMatrix(LinAlg::Matrix< DComplex > &H, const LinearOperator< LatticeFermionD > &A, const multi1d< LatticeFermionD > &evec, const multi1d< Double > &eval, int Nvecs, int NgoodEvecs)
Definition: inv_eigcg2.cc:1227

Chroma::InvEigCG2Env::vecPrecondCG_T
SystemSolverResults_t vecPrecondCG_T(const LinearOperator< T > &A, T &x, const T &b, const multi1d< Double > &eval, const multi1d< T > &evec, int startV, int endV, const Real &RsdCG, int MaxCG)
Definition: inv_eigcg2.cc:1010

Chroma::InvEigCG2Env::InvEigCG2_T
SystemSolverResults_t InvEigCG2_T(const LinearOperator< T > &A, T &x, const T &b, multi1d< Double > &eval, multi1d< T > &evec, int Neig, int Nmax, const Real &RsdCG, int MaxCG, const int PrintLevel)
Definition: inv_eigcg2.cc:373

Chroma::InvEigCG2Env::SubSpaceMatrix_T
void SubSpaceMatrix_T(LinAlg::Matrix< DComplex > &H, const LinearOperator< T > &A, const multi1d< T > &evec, const multi1d< Double > &eval, int Nvecs, int NgoodEvecs)
Definition: inv_eigcg2.cc:62

Chroma::InvEigCG2Env::InitGuess_T
void InitGuess_T(const LinearOperator< T > &A, T &x, const T &b, const multi1d< Double > &eval, const multi1d< T > &evec, int N, int &n_count)
Definition: inv_eigcg2.cc:1116

Chroma::InvEigCG2Env::InvEigCG2
SystemSolverResults_t InvEigCG2(const LinearOperator< LatticeFermionD > &A, LatticeFermionD &x, const LatticeFermionD &b, multi1d< Double > &eval, multi1d< LatticeFermionD > &evec, int Neig, int Nmax, const Real &RsdCG, int MaxCG, const int plvl)
Definition: inv_eigcg2.cc:1236

Chroma::StagPhases::beta
static const LatticeInteger & beta(const int dim)
Definition: stag_phases_s.h:47

Chroma::StagPhases::alpha
static const LatticeInteger & alpha(const int dim)
Definition: stag_phases_s.h:43

Chroma
Asqtad Staggered-Dirac operator.
Definition: klein_gord.cc:10

Chroma::RsdCG
const WilsonTypeFermAct< multi1d< LatticeFermion > > Handle< const ConnectState > const multi1d< Real > enum InvType invType const multi1d< Real > & RsdCG
Definition: pbg5p_w.cc:30

Chroma::QDP_error_exit
QDP_error_exit("too many BiCG iterations", n_count, rsd_sq, cp, c, re_rvr, im_rvr, re_a, im_a, re_b, im_b)

Chroma::n_count
int n_count
Definition: invbicg.cc:78

Chroma::p
p
Definition: invbicg.cc:157

Chroma::tmp
LatticeFermion tmp
Definition: mespbg5p_w.cc:36

Chroma::T
LinOpSysSolverMGProtoClover::T T
Definition: syssolver_linop_clover_mg_proto.cc:63

Chroma::MaxCG
const WilsonTypeFermAct< multi1d< LatticeFermion > > Handle< const ConnectState > const multi1d< Real > enum InvType invType const multi1d< Real > int MaxCG
Definition: pbg5p_w.cc:32

Chroma::rsd_sq
Real rsd_sq
Definition: invbicg.cc:121

Chroma::i
int i
Definition: pbg5p_w.cc:55

Chroma::PLUS
@ PLUS
Definition: chromabase.h:45

Chroma::r
r
Definition: invbicg.cc:137

Chroma::d
DComplex d
Definition: invbicg.cc:99

Chroma::START_CODE
START_CODE()

Chroma::A
A(A, psi, r, Ncb, PLUS)

Chroma::END_CODE
END_CODE()

Chroma::b
Complex b
Definition: invbicg.cc:96

Chroma::zero
Double zero
Definition: invbicg.cc:106

Chroma::k
int k
Definition: invbicg.cc:119

Octave::tag
std::string tag(const std::string &prefix)
Definition: octave.h:15

testing::internal::Double
FloatingPoint< double > Double
Definition: gtest.h:7351

norm_gram_schm.h
Gram-Schmidt with normalization.

Chroma::SystemSolverResults_t
Holds return info from SystemSolver call.
Definition: syssolver.h:17

Chroma::SystemSolverResults_t::n_count
int n_count
Definition: syssolver.h:20

Chroma::SystemSolverResults_t::resid
Real resid
Definition: syssolver.h:21

U
multi1d< LatticeColorMatrix > U
Definition: t_aniso_gaugeact.cc:11

T
LatticeFermion T
Definition: t_clover.cc:11