www/dox/multi__syssolver__mdagm__cg__wilson__quda__w_8h_source.html

 // -*- C++ -*-

 /*! \file

  *  \brief Solve the multi-shift system (MdagM + shift_i)*psi_i = chi by CG, using QUDA (Wilson fermions)

  */


 #ifndef __multi_syssolver_mdagm_cg_wilson_quda_w_h__

 #define __multi_syssolver_mdagm_cg_wilson_quda_w_h__


 #include "chroma_config.h"


 #ifdef BUILD_QUDA


 #include "handle.h"

 #include "syssolver.h"

 #include "linearop.h"

 #include "lmdagm.h"

 #include "actions/ferm/fermbcs/simple_fermbc.h"

 #include "actions/ferm/fermstates/periodic_fermstate.h"

 #include "actions/ferm/invert/quda_solvers/syssolver_quda_wilson_params.h"

 #include "meas/gfix/temporal_gauge.h"

 #include "io/aniso_io.h"

 #include <string>


 #include "util/gauge/reunit.h"


 #include <quda.h>


 namespace Chroma

 {


   //! Registration hook namespace for the QUDA Wilson multi-shift CG MdagM solver

   namespace MdagMMultiSysSolverCGQudaWilsonEnv

   {

     //! Register the syssolver
     /*!
      * Only declared in this header; the definition lives elsewhere.
      * \return bool status flag (its exact meaning is not visible from this
      *         declaration -- presumably "registration succeeded"; confirm
      *         against the definition)
      */

     bool registerAll();

   }


   //! Multi-shift MdagM system solver for Wilson fermions that delegates the solve to QUDA
   /*! \ingroup invert
    *
    *  The constructor translates the Chroma-side solver parameters into a
    *  QudaGaugeParam / QudaInvertParam pair and uploads the gauge field with
    *  loadGaugeQuda(); the destructor releases it again with freeGaugeQuda().
    *
    *  operator() passes the source and the list of shifts to qudaInvertMulti()
    *  (defined outside this header). Its verbose check measures the residual of
    *  ( A^dag A + shifts[i] ) psi[i] = chi  for every shift.
    *
    *  NOTE(review): the implicitly generated copy constructor is still
    *  available; destroying a copy would call freeGaugeQuda() a second time.
    *  Confirm that instances are never copied.
    */
   class MdagMMultiSysSolverCGQudaWilson : public MdagMMultiSystemSolver<LatticeFermion>
   {
   public:
     // Default-precision field types
     typedef LatticeFermion T;
     typedef LatticeColorMatrix U;
     typedef multi1d<LatticeColorMatrix> Q;
     typedef multi1d<LatticeColorMatrix> P;

     // "F"-suffixed counterparts
     typedef LatticeFermionF TF;
     typedef LatticeColorMatrixF UF;
     typedef multi1d<LatticeColorMatrixF> QF;
     typedef multi1d<LatticeColorMatrixF> PF;

     // "D"-suffixed counterparts
     typedef LatticeFermionD TD;
     typedef LatticeColorMatrixD UD;
     typedef multi1d<LatticeColorMatrixD> QD;
     typedef multi1d<LatticeColorMatrixD> PD;

     // Underlying word type of T; its size selects the CPU precision below
     typedef WordType<T>::Type_t REALT;

     //! Constructor: translate the parameters for QUDA and upload the gauge field
     /*!
      * \param M_        Linear operator; kept for subset() and for the
      *                  verbose residual check ( Read )
      * \param state_    Ferm state supplying the gauge links through
      *                  getLinks() ( Read )
      * \param invParam_ inverter parameters; copied into this object ( Read )
      *
      * Calls QDP_abort(1) if invParam_.solverType is anything other than CG.
      */
     MdagMMultiSysSolverCGQudaWilson(Handle< LinearOperator<T> > M_,
                                       Handle< FermState<T,P,Q> > state_,
                                       const SysSolverQUDAWilsonParams& invParam_) :
       A(M_), invParam(invParam_)
     {
       QDPIO::cout << "MdagMMultiSysSolverCGQUDAWilson: " << std::endl;

       // FOLLOWING INITIALIZATION in test QUDA program

       // 1) work out cpu_prec, cuda_prec, cuda_prec_sloppy
       // A 4-byte word means single precision on the host, anything else
       // is treated as double.
       if ( sizeof(REALT) == 4 ) {
         cpu_prec = QUDA_SINGLE_PRECISION;
       }
       else {
         cpu_prec = QUDA_DOUBLE_PRECISION;
       }

       // Work out GPU precision; unknown values fall back to the host precision
       switch( invParam.cudaPrecision ) {
       case HALF:
         gpu_prec = QUDA_HALF_PRECISION;
         break;
       case SINGLE:
         gpu_prec = QUDA_SINGLE_PRECISION;
         break;
       case DOUBLE:
         gpu_prec = QUDA_DOUBLE_PRECISION;
         break;
       default:
         gpu_prec = cpu_prec;
         break;
       }

       // The "sloppy" precision is simply set equal to the full GPU precision.
       // NOTE(review): no separate sloppy-precision parameter is consulted
       // here -- confirm this is intended for the multi-shift solver.
       gpu_half_prec = gpu_prec;

       // 2) pull 'new' GAUGE and Invert params
       QDPIO::cout << " Calling new QUDA Invert Param" << std::endl;
       q_gauge_param = newQudaGaugeParam();
       quda_inv_param = newQudaInvertParam();

       // 3) set lattice size (dimensions of the local sub-lattice)
       const multi1d<int>& latdims = Layout::subgridLattSize();

       q_gauge_param.X[0] = latdims[0];
       q_gauge_param.X[1] = latdims[1];
       q_gauge_param.X[2] = latdims[2];
       q_gauge_param.X[3] = latdims[3];

       // 4) - deferred (anisotropy)

       // 5) - set QUDA_WILSON_LINKS, QUDA_GAUGE_ORDER
       q_gauge_param.type = QUDA_WILSON_LINKS;
       q_gauge_param.gauge_order = QUDA_QDP_GAUGE_ORDER; // gauge[mu], p

       // 6) - set t_boundary
       // Convention: BC has to be applied already
       // This flag just tells QUDA that this is so,
       // so that QUDA can take care in the reconstruct
       if( invParam.AntiPeriodicT ) {
         q_gauge_param.t_boundary = QUDA_ANTI_PERIODIC_T;
       }
       else {
         q_gauge_param.t_boundary = QUDA_PERIODIC_T;
       }

       // Set cpu_prec, cuda_prec, reconstruct and sloppy versions
       q_gauge_param.cpu_prec = cpu_prec;
       q_gauge_param.cuda_prec = gpu_prec;

       // Full-precision link reconstruction; unknown values fall back to 12
       switch( invParam.cudaReconstruct ) {
       case RECONS_NONE:
         q_gauge_param.reconstruct = QUDA_RECONSTRUCT_NO;
         break;
       case RECONS_8:
         q_gauge_param.reconstruct = QUDA_RECONSTRUCT_8;
         break;
       case RECONS_12:
         q_gauge_param.reconstruct = QUDA_RECONSTRUCT_12;
         break;
       default:
         q_gauge_param.reconstruct = QUDA_RECONSTRUCT_12;
         break;
       }

       q_gauge_param.cuda_prec_sloppy = gpu_half_prec;

       // Sloppy link reconstruction; unknown values fall back to 12
       switch( invParam.cudaSloppyReconstruct ) {
       case RECONS_NONE:
         q_gauge_param.reconstruct_sloppy = QUDA_RECONSTRUCT_NO;
         break;
       case RECONS_8:
         q_gauge_param.reconstruct_sloppy = QUDA_RECONSTRUCT_8;
         break;
       case RECONS_12:
         q_gauge_param.reconstruct_sloppy = QUDA_RECONSTRUCT_12;
         break;
       default:
         q_gauge_param.reconstruct_sloppy = QUDA_RECONSTRUCT_12;
         break;
       }

       // Gauge fixing:

       // These are the links
       // They may be smeared and the BC's may be applied
       Q links_single(Nd);

       // Working copy of the links. Despite the variable name, Q is
       // multi1d<LatticeColorMatrix>, so no precision change happens here.
       for(int mu=0; mu < Nd; mu++) {
         links_single[mu] = (state_->getLinks())[mu];
       }

       // GaugeFix
       if( invParam.axialGaugeP ) {
         QDPIO::cout << "Fixing Temporal Gauge" << std::endl;

         // temporalGauge fills GFixMat (decay direction Nd-1). The links
         // handed to QUDA are then rebuilt from the ORIGINAL links as
         // g(x) U_mu(x) g^dag(x+mu).
         temporalGauge(links_single, GFixMat, Nd-1);
         for(int mu=0; mu < Nd; mu++){
           links_single[mu] = GFixMat*(state_->getLinks())[mu]*adj(shift(GFixMat, FORWARD, mu));
         }
         q_gauge_param.gauge_fix = QUDA_GAUGE_FIXED_YES;
       }
       else {
         // No GaugeFix
         q_gauge_param.gauge_fix = QUDA_GAUGE_FIXED_NO;  // No Gfix yet
       }

       // deferred 4) Gauge Anisotropy
       const AnisoParam_t& aniso = invParam.WilsonParams.anisoParam;
       if( aniso.anisoP ) {                     // Anisotropic case
         Real gamma_f = aniso.xi_0 / aniso.nu;
         q_gauge_param.anisotropy = toDouble(gamma_f);
       }
       else {
         q_gauge_param.anisotropy = 1.0;
       }

       // Rescale the links by the fermion coefficients in the anisotropic case
       if( aniso.anisoP ) {                     // Anisotropic case
         multi1d<Real> cf=makeFermCoeffs(aniso);
         for(int mu=0; mu < Nd; mu++) {
           links_single[mu] *= cf[mu];
         }
       }

       // Now onto the inv param:
       // Dslash type
       quda_inv_param.dslash_type = QUDA_WILSON_DSLASH;
       solver_string = "MULTI_CG";
       quda_inv_param.inv_type = QUDA_CG_INVERTER;

       // Mass: kappa = 1 / ( 2 * (1 + 3/anisotropy + Mass) )
       Real massParam = Real(1) + Real(3)/Real(q_gauge_param.anisotropy) + invParam.WilsonParams.Mass;
       quda_inv_param.kappa = 1.0/(2*toDouble(massParam));

       // FIXME: We set clover coeff to a dummy value. This is dumb
       // If we ever get QUDA to compute our clover term we will need to fix this.
       quda_inv_param.clover_coeff = 1.0; // dummy value

       quda_inv_param.mass_normalization = QUDA_ASYMMETRIC_MASS_NORMALIZATION;

       // Stopping criteria and solver tuning knobs taken from the parameters
       quda_inv_param.tol = toDouble(invParam.RsdTarget);
       quda_inv_param.maxiter = invParam.MaxIter;
       quda_inv_param.reliable_delta = toDouble(invParam.Delta);
       quda_inv_param.pipeline = invParam.Pipeline;

       // Solution type
       quda_inv_param.solution_type = QUDA_MATPCDAG_MATPC_SOLUTION;

       // Solve type: only CG is accepted, anything else aborts
       switch( invParam.solverType ) {
       case CG:
         quda_inv_param.solve_type = QUDA_NORMOP_PC_SOLVE;
         break;
       default:
         QDPIO::cerr << "Only CG Is currently implemented for multi-shift" << std::endl;
         QDP_abort(1);
       }

       // Even-odd preconditioning flavour
       if( invParam.asymmetricP ) {
         QDPIO::cout << "Asymmetric LinOP" << std::endl;
         quda_inv_param.matpc_type = QUDA_MATPC_ODD_ODD_ASYMMETRIC;
       }
       else {
         QDPIO::cout << "Symmetric LinOp" << std::endl;
         quda_inv_param.matpc_type = QUDA_MATPC_ODD_ODD;
       }

       quda_inv_param.dagger = QUDA_DAG_NO;

       quda_inv_param.cpu_prec = cpu_prec;
       quda_inv_param.cuda_prec = gpu_prec;
       quda_inv_param.cuda_prec_sloppy = gpu_half_prec;
       quda_inv_param.preserve_source = QUDA_PRESERVE_SOURCE_YES;
       quda_inv_param.dirac_order = QUDA_DIRAC_ORDER;
       quda_inv_param.gamma_basis = QUDA_DEGRAND_ROSSI_GAMMA_BASIS;

       // Autotuning
       if( invParam.tuneDslashP ) {
         QDPIO::cout << "Enabling Dslash Autotuning" << std::endl;
         quda_inv_param.tune = QUDA_TUNE_YES;
       }
       else {
         QDPIO::cout << "Disabling Dslash Autotuning" << std::endl;
         quda_inv_param.tune = QUDA_TUNE_NO;
       }

       // PADDING

       // Setup padding: half the volume of each face of the local lattice;
       // the gauge pad is the largest of the four.
       multi1d<int> face_size(4);
       face_size[0] = latdims[1]*latdims[2]*latdims[3]/2;
       face_size[1] = latdims[0]*latdims[2]*latdims[3]/2;
       face_size[2] = latdims[0]*latdims[1]*latdims[3]/2;
       face_size[3] = latdims[0]*latdims[1]*latdims[2]/2;

       int max_face = face_size[0];
       for(int i=1; i <=3; i++) {
         if ( face_size[i] > max_face ) {
           max_face = face_size[i];
         }
       }

       q_gauge_param.ga_pad = max_face;
       quda_inv_param.sp_pad = 0;
       quda_inv_param.cl_pad = 0;

       // Setting GCR Preconditioner to defaults, as we don't use it..
       // This is kinda yucky.
       QDPIO::cout << "Setting Precondition stuff to defaults for not using" << std::endl;
       quda_inv_param.inv_type_precondition= QUDA_INVALID_INVERTER;
       quda_inv_param.tol_precondition = 1.0e-1;
       quda_inv_param.maxiter_precondition = 1000;
       quda_inv_param.verbosity_precondition = QUDA_SILENT;
       quda_inv_param.gcrNkrylov = 1;

       if( invParam.verboseP ) {
         quda_inv_param.verbosity = QUDA_VERBOSE;
       }
       else {
         quda_inv_param.verbosity = QUDA_SUMMARIZE;
       }

       // Set up the links: one raw pointer per direction, each pointing at
       // the first real component of the first site of links_single[mu].
       // NOTE(review): the array holds 4 entries while the loop runs to Nd;
       // this relies on Nd == 4 (as does the X[0..3] setup above).
       void* gauge[4];

       for(int mu=0; mu < Nd; mu++) {
         gauge[mu] = (void *)&(links_single[mu].elem(all.start()).elem().elem(0,0).real());
       }

       loadGaugeQuda((void *)gauge, &q_gauge_param);
     }

     //! Destructor: releases the gauge field through freeGaugeQuda()
     ~MdagMMultiSysSolverCGQudaWilson() {
       QDPIO::cout << "Destructing" << std::endl;
       freeGaugeQuda();
     }

     //! Return the subset on which the operator acts
     const Subset& subset() const {return A->subset();}

     //! Solve the linear system for every shift
     /*!
      * \param psi      solutions, one per shift ( Modify )
      * \param shifts   the shifts ( Read )
      * \param chi      source ( Read )
      * \return syssolver results as returned by qudaInvertMulti()
      *
      * With invParam.axialGaugeP set, the source is multiplied by GFixMat on
      * rb[1] before the solve, all initial guesses are zeroed, and the
      * solutions are multiplied by adj(GFixMat) afterwards.
      * With invParam.verboseP set, the relative residual of
      * ( A^dag A + shifts[i] ) psi[i] = chi is recomputed with the Chroma
      * operator and printed for each shift.
      */
     SystemSolverResults_t operator() (multi1d<T>& psi, const multi1d<Real>& shifts, const T& chi) const
     {
       START_CODE();

       StopWatch swatch;
       swatch.reset();
       swatch.start();

       SystemSolverResults_t res;
       res.n_count = 0;

       if ( invParam.axialGaugeP ) {
         T g_chi;
         multi1d<T> g_psi(psi.size());

         // Gauge Fix source and initial guess
         QDPIO::cout << "Gauge Fixing source and initial guess" << std::endl;
         g_chi[ rb[1] ]  = GFixMat * chi;
         for(int s=0; s < psi.size(); s++) {
           g_psi[s][ rb[1] ]  = zero; // All initial guesses are zero
         }

         QDPIO::cout << "Solving" << std::endl;
         res = qudaInvertMulti(g_chi, g_psi, shifts);

         QDPIO::cout << "Untransforming solution." << std::endl;
         for(int s=0; s< psi.size(); s++) {
           psi[s][ rb[1]]  = adj(GFixMat)*g_psi[s];
         }
       }
       else {
         res = qudaInvertMulti(chi, psi, shifts);
       }

       // The timer covers the solve (and gauge transformations) only,
       // not the verbose residual check below.
       swatch.stop();
       double elapsed_sec = swatch.getTimeInSeconds();

       if (invParam.verboseP )  {
         Double chinorm=norm2(chi, A->subset());
         multi1d<Double> r_rel(shifts.size());

         for(int i=0; i < shifts.size(); i++) {
           T tmp1,tmp2;
           tmp1 = zero;
           tmp2 = zero;

           (*A)(tmp1, psi[i], PLUS);
           (*A)(tmp2, tmp1, MINUS);  // tmp2 = A^\dagger A psi
           tmp2[ A->subset() ] += shifts[i]* psi[i]; // tmp2 = ( A^\dagger A + shift_i ) psi

           T r;
           r = zero;
           r[ A->subset() ] = chi - tmp2;

           // Relative residual |r| / |chi| on the operator's subset
           r_rel[i] = sqrt(norm2(r, A->subset())/chinorm );
           QDPIO::cout << "r[" <<i <<"] = " << r_rel[i] << std::endl;
         }
       }

       // Summary lines; tagged WILSON to match the operator this solver uses
       QDPIO::cout << "MULTI_CG_QUDA_WILSON_SOLVER: " << res.n_count << " iterations. Rsd = " << res.resid << std::endl;
       QDPIO::cout << "MULTI_CG_QUDA_WILSON_SOLVER: "<<elapsed_sec<< " sec" << std::endl;

       END_CODE();

       return res;
     }

   private:
     // Hide default constructor
     MdagMMultiSysSolverCGQudaWilson() {}

     // Gauge transformation matrix filled by temporalGauge() when
     // invParam.axialGaugeP is set; used to transform source and solutions
     U GFixMat;

     // Precisions chosen in the constructor
     QudaPrecision_s cpu_prec;
     QudaPrecision_s gpu_prec;
     QudaPrecision_s gpu_half_prec;   // sloppy precision (set equal to gpu_prec)

     // Chroma-side operator: provides subset() and the verbose residual check
     Handle< LinearOperator<T> > A;

     // Private copy of the solver parameters
     const SysSolverQUDAWilsonParams invParam;

     // QUDA parameter structures filled in by the constructor.
     // quda_inv_param is mutable, so const member functions may modify it.
     QudaGaugeParam q_gauge_param;
     mutable QudaInvertParam quda_inv_param;

     // The actual multi-shift solve; defined outside this header
     SystemSolverResults_t qudaInvertMulti(const T& chi_s,
                                      multi1d<T>& psi_s,
                                      multi1d<Real> shifts
                                      )const ;

     // Solver label, set to "MULTI_CG" in the constructor
     std::string solver_string;

   };


 } // End namespace


 #endif

 #endif


aniso_io.h
Anisotropy parameters.

chroma_config.h

mu
int mu
Definition: cool.cc:24

Chroma::temporalGauge
void temporalGauge(multi1d< LatticeColorMatrix > &ug, LatticeColorMatrix &g, int decay_dir)
Temporal gauge fixing.
Definition: temporal_gauge.cc:26

Chroma::CG
@ CG
Definition: syssolver_qphix_clover_params.h:16

handle.h
Class for counted reference semantics.

linearop.h
Linear Operators.

lmdagm.h
M^dag*M composition of a linear operator.

Nd
Nd
Definition: meslate.cc:74

tmp2
Double tmp2
Definition: mesq.cc:30

Chroma::InlineDiscoEigCGEnv::P
multi1d< LatticeColorMatrix > P
Definition: inline_disco_eigcg_w.cc:315

Chroma::MdagMMultiSysSolverCGQudaWilsonEnv::registerAll
bool registerAll()
Register all the factories.
Definition: multi_syssolver_mdagm_cg_wilson_quda_w.cc:35

Chroma::SimpleBaryonSeqSourceEnv::operator()
multi1d< Hadron2PtContraction_t > operator()(const multi1d< LatticeColorMatrix > &u)

Chroma
Asqtad Staggered-Dirac operator.
Definition: klein_gord.cc:10

Chroma::Q
LinOpSysSolverMGProtoClover::Q Q
Definition: syssolver_linop_clover_mg_proto.cc:64

Chroma::T
LinOpSysSolverMGProtoClover::T T
Definition: syssolver_linop_clover_mg_proto.cc:63

Chroma::i
int i
Definition: pbg5p_w.cc:55

Chroma::MINUS
@ MINUS
Definition: chromabase.h:45

Chroma::PLUS
@ PLUS
Definition: chromabase.h:45

Chroma::chi
multi1d< LatticeFermion > chi(Ncb)

Chroma::r
r
Definition: invbicg.cc:137

Chroma::psi
LatticeFermion psi
Definition: mespbg5p_w.cc:35

Chroma::START_CODE
START_CODE()

Chroma::A
A(A, psi, r, Ncb, PLUS)

Chroma::END_CODE
END_CODE()

Chroma::zero
Double zero
Definition: invbicg.cc:106

Chroma::makeFermCoeffs
multi1d< Real > makeFermCoeffs(const AnisoParam_t &aniso)
Make fermion coefficients.
Definition: aniso_io.cc:63

Chroma::s
multi1d< LatticeFermion > s(Ncb)

Chroma::RECONS_12
@ RECONS_12
Definition: enum_quda_io.h:80

Chroma::RECONS_NONE
@ RECONS_NONE
Definition: enum_quda_io.h:78

Chroma::RECONS_8
@ RECONS_8
Definition: enum_quda_io.h:79

Chroma::SINGLE
@ SINGLE
Definition: enum_quda_io.h:54

Chroma::HALF
@ HALF
Definition: enum_quda_io.h:53

Chroma::DOUBLE
@ DOUBLE
Definition: enum_quda_io.h:55

testing::internal::Double
FloatingPoint< double > Double
Definition: gtest.h:7351

testing::internal::string
::std::string string
Definition: gtest.h:1979

periodic_fermstate.h
Periodic ferm state and a creator.

FORWARD
#define FORWARD
Definition: primitives.h:82

reunit.h
Reunitarize in place a color matrix to SU(N)

simple_fermbc.h
Simple fermionic BC.

syssolver.h
Linear system solvers.

syssolver_quda_wilson_params.h

U
multi1d< LatticeColorMatrix > U
Definition: t_aniso_gaugeact.cc:11

T
LatticeFermion T
Definition: t_clover.cc:11

Q
multi1d< LatticeColorMatrix > Q
Definition: t_clover.cc:12

QF
multi1d< LatticeColorMatrixF > QF
Definition: t_quda_tprec.cc:19

UF
LatticeColorMatrixF UF
Definition: t_quda_tprec.cc:18

PF
multi1d< LatticeColorMatrixF > PF
Definition: t_quda_tprec.cc:20

TD
LatticeFermionD TD
Definition: t_quda_tprec.cc:22

UD
LatticeColorMatrixD UD
Definition: t_quda_tprec.cc:23

TF
LatticeFermionF TF
Definition: t_quda_tprec.cc:17

PD
multi1d< LatticeColorMatrixD > PD
Definition: t_quda_tprec.cc:25

QD
multi1d< LatticeColorMatrixD > QD
Definition: t_quda_tprec.cc:24

temporal_gauge.h
Axial gauge fixing.