docs/html.1.2.x/Imp_2fopr__Wilson__impl_8cpp_source.html

 #include <valarray>

 using std::valarray;

 #include <string>

 using std::string;


 #include "fopr_Wilson_impl.h"


 #include "threadManager_OpenMP.h"


 //#define USE_SU2


 #if defined USE_GROUP_SU3

 #include "fopr_Wilson_impl_SU3.inc"

 #elif defined USE_GROUP_SU2

 #include "fopr_Wilson_impl_SU2.inc"

 #elif defined USE_GROUP_SU_N

 #include "fopr_Wilson_impl_SU_N.inc"

 #endif


 // Name used as the "%s" prefix of every vout message emitted by this class.
 const std::string Fopr_Wilson::Fopr_Wilson_impl::class_name("Fopr_Wilson_impl");


 //====================================================================

 // Initialise the operator for the gamma-matrix representation `repr`.
 //
 // Reads the sizes from CommonParameters, stores the five gamma matrices,
 // selects the representation-dependent kernels, sizes the work fields and
 // allocates the send/receive buffers used for data transfer.
 //
 //   repr : "Dirac" or "Chiral". Any other value is reported through
 //          vout.crucial and the program aborts.
 //
 // The buffers allocated here with new[] are released by tidyup().
 void Fopr_Wilson::Fopr_Wilson_impl::init(string repr)
 {
   m_vl = CommonParameters::Vlevel();
   vout.general(m_vl, "%s: Construction of Wilson fermion operator(imp).\n", class_name.c_str());

   check_Nc();

   // Sizes taken from CommonParameters, and the counts derived from Nc.
   m_Nc  = CommonParameters::Nc();
   m_Nd  = CommonParameters::Nd();
   m_Nvc = 2 * m_Nc;
   m_Ndf = 2 * m_Nc * m_Nc;

   m_Nx = CommonParameters::Nx();
   m_Ny = CommonParameters::Ny();
   m_Nz = CommonParameters::Nz();
   m_Nt = CommonParameters::Nt();

   m_Nvol = CommonParameters::Nvol();
   m_Ndim = CommonParameters::Ndim();

   // One boundary-condition entry per direction; filled by set_parameters().
   m_boundary.resize(m_Ndim);
   m_boundary2.resize(m_Ndim);

   m_repr = repr;

   // Gamma matrices: slots 0..3 hold GAMMA1..GAMMA4, slot 4 holds GAMMA5.
   m_GM.resize(m_Ndim + 1);
   GammaMatrixSet *gamma_set = GammaMatrixSet::New(m_repr);
   m_GM[0] = gamma_set->get_GM(GammaMatrixSet::GAMMA1);
   m_GM[1] = gamma_set->get_GM(GammaMatrixSet::GAMMA2);
   m_GM[2] = gamma_set->get_GM(GammaMatrixSet::GAMMA3);
   m_GM[3] = gamma_set->get_GM(GammaMatrixSet::GAMMA4);
   m_GM[4] = gamma_set->get_GM(GammaMatrixSet::GAMMA5);
   delete gamma_set;

   // No gauge configuration yet.
   m_U = 0;

   // Until set_mode() is called, mult/mult_dag point at mult_undef.
   m_mult     = &Fopr_Wilson::Fopr_Wilson_impl::mult_undef;
   m_mult_dag = &Fopr_Wilson::Fopr_Wilson_impl::mult_undef;

   // Kernels that depend on the gamma-matrix representation.
   if (m_repr == "Dirac") {
     m_D       = &Fopr_Wilson::Fopr_Wilson_impl::D_dirac;
     m_D_ex    = &Fopr_Wilson::Fopr_Wilson_impl::D_ex_dirac;
     m_gm5     = &Fopr_Wilson::Fopr_Wilson_impl::gm5_dirac;
     m_mult_tp = &Fopr_Wilson::Fopr_Wilson_impl::mult_tp_dirac;
     m_mult_tm = &Fopr_Wilson::Fopr_Wilson_impl::mult_tm_dirac;
   } else if (m_repr == "Chiral") {
     m_D       = &Fopr_Wilson::Fopr_Wilson_impl::D_chiral;
     m_D_ex    = &Fopr_Wilson::Fopr_Wilson_impl::D_ex_chiral;
     m_gm5     = &Fopr_Wilson::Fopr_Wilson_impl::gm5_chiral;
     m_mult_tp = &Fopr_Wilson::Fopr_Wilson_impl::mult_tp_chiral;
     m_mult_tm = &Fopr_Wilson::Fopr_Wilson_impl::mult_tm_chiral;
   } else {
     vout.crucial(m_vl, "%s: input repr is undefined.\n", class_name.c_str());
     abort();
   }

   // Temporary fields with a single external component.
   const int n_inner = m_Nvc * m_Nd;
   m_w1.reset(n_inner, m_Nvol, 1);
   m_w2.reset(n_inner, m_Nvol, 1);

   // Transfer buffers: for each direction the element count is
   // (m_Nvc * 2) times the product of the three other lattice extents.
   // vcp1_* are passed to Communicator::exchange as send buffers and
   // vcp2_* as receive buffers (see the D_ex_* and mult_* methods).
   const int n_per_site = m_Nvc * 2;

   const int Nvx = n_per_site * m_Ny * m_Nz * m_Nt;
   vcp1_xp = new double[Nvx];
   vcp2_xp = new double[Nvx];
   vcp1_xm = new double[Nvx];
   vcp2_xm = new double[Nvx];

   const int Nvy = n_per_site * m_Nx * m_Nz * m_Nt;
   vcp1_yp = new double[Nvy];
   vcp2_yp = new double[Nvy];
   vcp1_ym = new double[Nvy];
   vcp2_ym = new double[Nvy];

   const int Nvz = n_per_site * m_Nx * m_Ny * m_Nt;
   vcp1_zp = new double[Nvz];
   vcp2_zp = new double[Nvz];
   vcp1_zm = new double[Nvz];
   vcp2_zm = new double[Nvz];

   const int Nvt = n_per_site * m_Nx * m_Ny * m_Nz;
   vcp1_tp = new double[Nvt];
   vcp2_tp = new double[Nvt];
   vcp1_tm = new double[Nvt];
   vcp2_tm = new double[Nvt];

   setup_thread();
 }


 //====================================================================

 void Fopr_Wilson::Fopr_Wilson_impl::set_mode(std::string mode)

 {

   m_mode = mode;


   if (m_mode == "D") {

     m_mult     = &Fopr_Wilson::Fopr_Wilson_impl::D;

     m_mult_dag = &Fopr_Wilson::Fopr_Wilson_impl::Ddag;

   } else if (m_mode == "Ddag") {

     m_mult     = &Fopr_Wilson::Fopr_Wilson_impl::Ddag;

     m_mult_dag = &Fopr_Wilson::Fopr_Wilson_impl::D;

   } else if (m_mode == "DdagD") {

     m_mult     = &Fopr_Wilson::Fopr_Wilson_impl::DdagD;

     m_mult_dag = &Fopr_Wilson::Fopr_Wilson_impl::DdagD;

   } else if (m_mode == "DDdag") {

     m_mult     = &Fopr_Wilson::Fopr_Wilson_impl::DDdag;

     m_mult_dag = &Fopr_Wilson::Fopr_Wilson_impl::DDdag;

   } else if (m_mode == "H") {

     m_mult     = &Fopr_Wilson::Fopr_Wilson_impl::H;

     m_mult_dag = &Fopr_Wilson::Fopr_Wilson_impl::H;

   } else {

     vout.crucial(m_vl, "%s: input mode is undefined.\n", class_name.c_str());

     abort();

   }


 }


 //====================================================================

 // Release the sixteen transfer buffers allocated with new[] in init().
 //
 // Each pointer is reset to null after its array is freed, so the members
 // never dangle and a repeated call to tidyup() is harmless
 // (delete[] on a null pointer is a no-op).
 void Fopr_Wilson::Fopr_Wilson_impl::tidyup()
 {
   // Same release order as the allocation order in init().
   double **buffers[] = {
     &vcp1_xp, &vcp2_xp, &vcp1_xm, &vcp2_xm,
     &vcp1_yp, &vcp2_yp, &vcp1_ym, &vcp2_ym,
     &vcp1_zp, &vcp2_zp, &vcp1_zm, &vcp2_zm,
     &vcp1_tp, &vcp2_tp, &vcp1_tm, &vcp2_tm
   };
   const int n_buffers = static_cast<int>(sizeof(buffers) / sizeof(buffers[0]));

   for (int k = 0; k < n_buffers; ++k) {
     delete[] *buffers[k];
     *buffers[k] = 0;
   }
 }


 //====================================================================

 // Return a copy of the mode string last stored by set_mode().
 std::string Fopr_Wilson::Fopr_Wilson_impl::get_mode() const
 {
   const std::string& current_mode = m_mode;

   return current_mode;
 }


 //====================================================================

 void Fopr_Wilson::Fopr_Wilson_impl::set_parameters(const double kappa,

                                                    const valarray<int> bc)

 {

   assert(bc.size() == m_Ndim);


   m_kappa = kappa;


   for (int mu = 0; mu < m_Ndim; ++mu) {

     m_boundary[mu] = bc[mu];

   }


   vout.general(m_vl, "%s: input parameters\n", class_name.c_str());

   vout.general(m_vl, "  kappa  = %8.4f\n", m_kappa);

   for (int mu = 0; mu < m_Ndim; ++mu) {

     vout.general(m_vl, "  boundary[%d] = %2d\n", mu, m_boundary[mu]);

   }


   // boundary condition for each node:

   for (int idir = 0; idir < m_Ndim; ++idir) {

     m_boundary2[idir] = 1.0;

     if (Communicator::ipe(idir) == 0) m_boundary2[idir] = m_boundary[idir];

   }


 }


 //====================================================================

 // Return the floating-point operation count of one operator application
 // in the current mode.
 //
 // The per-site count is tied to this particular implementation and must
 // be recalculated whenever the kernels change. The present numbers are
 // based on rev.1107. [24 Aug 2014 H.Matsufuru]
 //
 // The count is the per-site value times CommonParameters::Lvol(), and is
 // doubled for the "DdagD" and "DDdag" modes. An unknown representation
 // is reported through vout.crucial and the program aborts.
 double Fopr_Wilson::Fopr_Wilson_impl::flop_count()
 {
   const int Lvol = CommonParameters::Lvol();

   // Building blocks of the per-site formulas (integer arithmetic).
   const int term_a = 4 * m_Nc + 2;
   const int term_b = 4 * m_Nc + 1;

   int flop_per_site = 0;

   if (m_repr == "Dirac") {
     flop_per_site = m_Nc * m_Nd * (4 + 6 * term_a + 2 * term_b);
   } else if (m_repr == "Chiral") {
     flop_per_site = m_Nc * m_Nd * (4 + 8 * term_a);
   } else {
     vout.crucial(m_vl, "%s: input repr is undefined.\n",
                  class_name.c_str());
     abort();
   }

   const double flop_single = static_cast<double>(flop_per_site)
                              * static_cast<double>(Lvol);

   const bool applies_twice = (m_mode == "DdagD") || (m_mode == "DDdag");

   return applies_twice ? flop_single * 2.0 : flop_single;
 }


 //====================================================================

 // Dirac-representation operator on whole fields: forwards to D_ex_dirac
 // with external index 0 for both the output w and the input f.
 void Fopr_Wilson::Fopr_Wilson_impl::D_dirac(Field& w, const Field& f)
 {
   const int ex_out = 0;
   const int ex_in  = 0;

   D_ex_dirac(w, ex_out, f, ex_in);
 }


 //====================================================================

 // Chiral-representation operator on whole fields: forwards to D_ex_chiral
 // with external index 0 for both the output w and the input f.
 void Fopr_Wilson::Fopr_Wilson_impl::D_chiral(Field& w, const Field& f)
 {
   const int ex_out = 0;
   const int ex_in  = 0;

   D_ex_chiral(w, ex_out, f, ex_in);
 }


 //====================================================================

 // Dispatch to the "plus" kernel of direction mu.
 //
 //   mu : 0, 1, 2 select mult_xp, mult_yp, mult_zp; 3 selects the
 //        representation-dependent kernel stored in m_mult_tp.
 //        Any other value is reported through vout.crucial and aborts.
 //   w  : output field handed to the kernel.
 //   f  : input field.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_up(int mu,
                                             Field& w, const Field& f)
 {
   switch (mu) {
   case 0:
     mult_xp(w, f);
     break;

   case 1:
     mult_yp(w, f);
     break;

   case 2:
     mult_zp(w, f);
     break;

   case 3:
     (this->*m_mult_tp)(w, f);
     break;

   default:
     vout.crucial(m_vl, "%s: illegal direction of mu in mult_up.\n", class_name.c_str());
     abort();
   }
 }


 //====================================================================

 // Dispatch to the "minus" kernel of direction mu.
 //
 //   mu : 0, 1, 2 select mult_xm, mult_ym, mult_zm; 3 selects the
 //        representation-dependent kernel stored in m_mult_tm.
 //        Any other value is reported through vout.crucial and aborts.
 //   w  : output field handed to the kernel.
 //   f  : input field.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_dn(int mu, Field& w, const Field& f)
 {
   switch (mu) {
   case 0:
     mult_xm(w, f);
     break;

   case 1:
     mult_ym(w, f);
     break;

   case 2:
     mult_zm(w, f);
     break;

   case 3:
     (this->*m_mult_tm)(w, f);
     break;

   default:
     vout.crucial(m_vl, "%s: illegal direction of mu in mult_dn.\n", class_name.c_str());
     abort();
   }
 }


 //====================================================================

 // Wilson operator (Dirac representation) on one external component:
 // writes component ex1 of w from component ex2 of f.
 //
 // Contains orphaned OpenMP barrier/master directives and ends with
 // ThreadManager_OpenMP::sync_barrier_all(), so every thread of the team
 // has to call it together.
 //
 // Three phases:
 //   1. "*1" kernels fill the send buffers vcp1_* from f;
 //   2. the master thread exchanges vcp1_* -> vcp2_* with the neighbours;
 //   3. "*b" kernels act on (w, f), "*2" kernels feed the received vcp2_*
 //      into w, and daypx_thread applies w = -m_kappa * w + f.
 // NOTE(review): the "*b" kernels presumably handle the node-local part
 // and the "*2" kernels the boundary part; their bodies are not in this
 // file - confirm against the included .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::D_ex_dirac(Field& w, const int ex1,
                                                const Field& f, const int ex2)
 {
   // Number of doubles in one external component.
   const int block_size = m_Nvc * m_Nd * m_Nvol;

   double *src = const_cast<Field *>(&f)->ptr(block_size * ex2);
   double *dst = w.ptr(block_size * ex1);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

   // Phase 1: fill the send buffers for all eight directions.
   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xp1_thread(itask, vcp1_xp, src);
     mult_xm1_thread(itask, vcp1_xm, src);
     mult_yp1_thread(itask, vcp1_yp, src);
     mult_ym1_thread(itask, vcp1_ym, src);
     mult_zp1_thread(itask, vcp1_zp, src);
     mult_zm1_thread(itask, vcp1_zm, src);
     mult_tp1_dirac_thread(itask, vcp1_tp, src);
     mult_tm1_dirac_thread(itask, vcp1_tm, src);
   }
 #pragma omp barrier

   // Phase 2: only the master thread communicates. The barriers on both
   // sides make sure the send buffers are complete before the exchange and
   // the receive buffers are complete before anyone reads them.
 #pragma omp master
   {
     const int n_face_x = m_Nvc * 2 * m_Ny * m_Nz * m_Nt;
     Communicator::exchange(n_face_x, vcp2_xp, vcp1_xp, 0, 1, 1);
     Communicator::exchange(n_face_x, vcp2_xm, vcp1_xm, 0, -1, 2);

     const int n_face_y = m_Nvc * 2 * m_Nx * m_Nz * m_Nt;
     Communicator::exchange(n_face_y, vcp2_yp, vcp1_yp, 1, 1, 3);
     Communicator::exchange(n_face_y, vcp2_ym, vcp1_ym, 1, -1, 4);

     const int n_face_z = m_Nvc * 2 * m_Nx * m_Ny * m_Nt;
     Communicator::exchange(n_face_z, vcp2_zp, vcp1_zp, 2, 1, 5);
     Communicator::exchange(n_face_z, vcp2_zm, vcp1_zm, 2, -1, 6);

     const int n_face_t = m_Nvc * 2 * m_Nx * m_Ny * m_Nz;
     Communicator::exchange(n_face_t, vcp2_tp, vcp1_tp, 3, 1, 7);
     Communicator::exchange(n_face_t, vcp2_tm, vcp1_tm, 3, -1, 8);
   }
 #pragma omp barrier

   // Phase 3a: reset the output, then apply the "*b" kernels.
   for (int itask = task_begin; itask < task_end; ++itask) {
     clear_thread(itask, dst);
     mult_xpb_thread(itask, dst, src);
     mult_xmb_thread(itask, dst, src);
     mult_ypb_thread(itask, dst, src);
     mult_ymb_thread(itask, dst, src);
     mult_zpb_thread(itask, dst, src);
     mult_zmb_thread(itask, dst, src);
     mult_tpb_dirac_thread(itask, dst, src);
     mult_tmb_dirac_thread(itask, dst, src);
   }

   // Phase 3b: apply the "*2" kernels on the received buffers, then the
   // final scaling.
   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xp2_thread(itask, dst, vcp2_xp);
     mult_xm2_thread(itask, dst, vcp2_xm);
     mult_yp2_thread(itask, dst, vcp2_yp);
     mult_ym2_thread(itask, dst, vcp2_ym);
     mult_zp2_thread(itask, dst, vcp2_zp);
     mult_zm2_thread(itask, dst, vcp2_zm);
     mult_tp2_dirac_thread(itask, dst, vcp2_tp);
     mult_tm2_dirac_thread(itask, dst, vcp2_tm);
     daypx_thread(itask, dst, -m_kappa, src);   // w = -m_kappa * w + f.
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // Wilson operator (chiral representation) on one external component:
 // writes component ex1 of w from component ex2 of f.
 //
 // Contains orphaned OpenMP barrier/master directives and ends with
 // ThreadManager_OpenMP::sync_barrier_all(), so every thread of the team
 // has to call it together.
 //
 // Three phases:
 //   1. "*1" kernels fill the send buffers vcp1_* from f;
 //   2. the master thread exchanges vcp1_* -> vcp2_* with the neighbours;
 //   3. "*b" kernels act on (w, f), "*2" kernels feed the received vcp2_*
 //      into w, and daypx_thread applies w = -m_kappa * w + f.
 // NOTE(review): the "*b" kernels presumably handle the node-local part
 // and the "*2" kernels the boundary part; their bodies are not in this
 // file - confirm against the included .inc implementation.
 //
 // Legacy field-level formulation kept by the original author for
 // reference:
 //   clear(w);
 //   mult_xp(w,f); mult_xm(w,f); mult_yp(w,f); mult_ym(w,f);
 //   mult_zp(w,f); mult_zm(w,f);
 //   mult_tp_chiral(w,f); mult_tm_chiral(w,f);
 //   daypx(w, -m_kappa, f);   // w = -m_kappa * w + f.
 void Fopr_Wilson::Fopr_Wilson_impl::D_ex_chiral(Field& w, const int ex1,
                                                 const Field& f, const int ex2)
 {
   // Number of doubles in one external component.
   const int block_size = m_Nvc * m_Nd * m_Nvol;

   double *src = const_cast<Field *>(&f)->ptr(block_size * ex2);
   double *dst = w.ptr(block_size * ex1);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

   // Phase 1: fill the send buffers for all eight directions.
   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xp1_thread(itask, vcp1_xp, src);
     mult_xm1_thread(itask, vcp1_xm, src);
     mult_yp1_thread(itask, vcp1_yp, src);
     mult_ym1_thread(itask, vcp1_ym, src);
     mult_zp1_thread(itask, vcp1_zp, src);
     mult_zm1_thread(itask, vcp1_zm, src);
     mult_tp1_chiral_thread(itask, vcp1_tp, src);
     mult_tm1_chiral_thread(itask, vcp1_tm, src);
   }
 #pragma omp barrier

   // Phase 2: only the master thread communicates. The barriers on both
   // sides make sure the send buffers are complete before the exchange and
   // the receive buffers are complete before anyone reads them.
 #pragma omp master
   {
     const int n_face_x = m_Nvc * 2 * m_Ny * m_Nz * m_Nt;
     Communicator::exchange(n_face_x, vcp2_xp, vcp1_xp, 0, 1, 1);
     Communicator::exchange(n_face_x, vcp2_xm, vcp1_xm, 0, -1, 2);

     const int n_face_y = m_Nvc * 2 * m_Nx * m_Nz * m_Nt;
     Communicator::exchange(n_face_y, vcp2_yp, vcp1_yp, 1, 1, 3);
     Communicator::exchange(n_face_y, vcp2_ym, vcp1_ym, 1, -1, 4);

     const int n_face_z = m_Nvc * 2 * m_Nx * m_Ny * m_Nt;
     Communicator::exchange(n_face_z, vcp2_zp, vcp1_zp, 2, 1, 5);
     Communicator::exchange(n_face_z, vcp2_zm, vcp1_zm, 2, -1, 6);

     const int n_face_t = m_Nvc * 2 * m_Nx * m_Ny * m_Nz;
     Communicator::exchange(n_face_t, vcp2_tp, vcp1_tp, 3, 1, 7);
     Communicator::exchange(n_face_t, vcp2_tm, vcp1_tm, 3, -1, 8);
   }
 #pragma omp barrier

   // Phase 3a: reset the output, then apply the "*b" kernels.
   for (int itask = task_begin; itask < task_end; ++itask) {
     clear_thread(itask, dst);
     mult_xpb_thread(itask, dst, src);
     mult_xmb_thread(itask, dst, src);
     mult_ypb_thread(itask, dst, src);
     mult_ymb_thread(itask, dst, src);
     mult_zpb_thread(itask, dst, src);
     mult_zmb_thread(itask, dst, src);
     mult_tpb_chiral_thread(itask, dst, src);
     mult_tmb_chiral_thread(itask, dst, src);
   }

   // Phase 3b: apply the "*2" kernels on the received buffers, then the
   // final scaling.
   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xp2_thread(itask, dst, vcp2_xp);
     mult_xm2_thread(itask, dst, vcp2_xm);
     mult_yp2_thread(itask, dst, vcp2_yp);
     mult_ym2_thread(itask, dst, vcp2_ym);
     mult_zp2_thread(itask, dst, vcp2_zp);
     mult_zm2_thread(itask, dst, vcp2_zm);
     mult_tp2_chiral_thread(itask, dst, vcp2_tp);
     mult_tm2_chiral_thread(itask, dst, vcp2_tm);
     daypx_thread(itask, dst, -m_kappa, src);   // w = -m_kappa * w + f.
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 void Fopr_Wilson::Fopr_Wilson_impl::mult_gm5p(int mu,

                                               Field& v, const Field& w)

 {

   clear(m_w2);


   mult_up(mu, m_w2, w);

   mult_gm5(v, m_w2);

 }


 //====================================================================

 // Store v + ipm * gamma5 * v into w, one external component each.
 //
 //   w   : output field; component ex1 is overwritten.
 //   ex1 : external index in w.
 //   v   : input field.
 //   ex2 : external index in v.
 //   ipm : chirality sign, +1 or -1. Any other value is reported through
 //         vout.crucial and the program aborts.
 //
 // Uses the temporary fields m_w1 and m_w2. No factor 1/2 is applied here.
 void Fopr_Wilson::Fopr_Wilson_impl::proj_chiral(Field& w, const int ex1,
                                                 const Field& v, const int ex2, const int ipm)
 {
   const bool sign_ok = (ipm == 1) || (ipm == -1);

   if (!sign_ok) {
     vout.crucial(m_vl, "%s: illegal chirality = %d.\n", class_name.c_str(), ipm);
     abort();
   }

   // ipm is exactly +1 or -1 at this point.
   const double sign = static_cast<double>(ipm);

   m_w1.setpart_ex(0, v, ex2);         // m_w1  = v[ex2]
   mult_gm5(m_w2, m_w1);               // m_w2  = gamma5 * m_w1
   m_w1.addpart_ex(0, m_w2, 0, sign);  // m_w1 += sign * m_w2
   w.setpart_ex(ex1, m_w1, 0);         // w[ex1] = m_w1
 }


 //====================================================================

 // Run daypx_thread on this thread's share of the tasks, i.e.
 // w = fac * w + f (the formula given by the file's note on daypx_thread).
 //
 //   w   : field updated in place.
 //   fac : scale factor passed to daypx_thread.
 //   f   : field passed as the second operand.
 //
 // No barrier is issued here; synchronisation is left to the caller.
 void Fopr_Wilson::Fopr_Wilson_impl::daypx(Field& w,
                                           double fac, const Field& f)
 {
   double *src = const_cast<Field *>(&f)->ptr(0);
   double *dst = w.ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

   for (int itask = task_begin; itask < task_end; ++itask) {
     daypx_thread(itask, dst, fac, src);
   }
 }


 //====================================================================

 // Run clear_thread on this thread's share of the tasks for field w.
 //
 // No barrier is issued here; synchronisation is left to the caller.
 void Fopr_Wilson::Fopr_Wilson_impl::clear(Field& w)
 {
   double *dst = w.ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

   for (int itask = task_begin; itask < task_end; ++itask) {
     clear_thread(itask, dst);
   }
 }


 //====================================================================

 // Run gm5_dirac_thread (gamma5 kernel, Dirac representation) on this
 // thread's share of the tasks, writing w from f.
 //
 // No barrier is issued here; synchronisation is left to the caller.
 void Fopr_Wilson::Fopr_Wilson_impl::gm5_dirac(Field& w, const Field& f)
 {
   double *src = const_cast<Field *>(&f)->ptr(0);
   double *dst = w.ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

   for (int itask = task_begin; itask < task_end; ++itask) {
     gm5_dirac_thread(itask, dst, src);
   }
 }


 //====================================================================

 // Run gm5_chiral_thread (gamma5 kernel, chiral representation) on this
 // thread's share of the tasks, writing w from f.
 //
 // No barrier is issued here; synchronisation is left to the caller.
 void Fopr_Wilson::Fopr_Wilson_impl::gm5_chiral(Field& w, const Field& f)
 {
   double *src = const_cast<Field *>(&f)->ptr(0);
   double *dst = w.ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

   for (int itask = task_begin; itask < task_end; ++itask) {
     gm5_chiral_thread(itask, dst, src);
   }
 }


 //====================================================================

 // "Plus" kernel in the x direction: updates w from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_xp, let the master thread exchange it into vcp2_xp
 // (idir = 0, ipm = +1, tag 1), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_xp(Field& w, const Field& f)
 {
   double *src = const_cast<Field *>(&f)->ptr(0);
   double *dst = w.ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xp1_thread(itask, vcp1_xp, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Ny * m_Nz * m_Nt;
     Communicator::exchange(n_face, vcp2_xp, vcp1_xp, 0, 1, 1);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xpb_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xp2_thread(itask, dst, vcp2_xp);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // "Minus" kernel in the x direction: updates w from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_xm, let the master thread exchange it into vcp2_xm
 // (idir = 0, ipm = -1, tag 2), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_xm(Field& w, const Field& f)
 {
   double *dst = w.ptr(0);
   double *src = const_cast<Field *>(&f)->ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xm1_thread(itask, vcp1_xm, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Ny * m_Nz * m_Nt;
     Communicator::exchange(n_face, vcp2_xm, vcp1_xm, 0, -1, 2);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xmb_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_xm2_thread(itask, dst, vcp2_xm);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // "Plus" kernel in the y direction: updates w from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_yp, let the master thread exchange it into vcp2_yp
 // (idir = 1, ipm = +1, tag 3), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_yp(Field& w, const Field& f)
 {
   double *src = const_cast<Field *>(&f)->ptr(0);
   double *dst = w.ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_yp1_thread(itask, vcp1_yp, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Nx * m_Nz * m_Nt;
     Communicator::exchange(n_face, vcp2_yp, vcp1_yp, 1, 1, 3);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_ypb_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_yp2_thread(itask, dst, vcp2_yp);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // "Minus" kernel in the y direction: updates w from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_ym, let the master thread exchange it into vcp2_ym
 // (idir = 1, ipm = -1, tag 4), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_ym(Field& w, const Field& f)
 {
   double *dst = w.ptr(0);
   double *src = const_cast<Field *>(&f)->ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_ym1_thread(itask, vcp1_ym, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Nx * m_Nz * m_Nt;
     Communicator::exchange(n_face, vcp2_ym, vcp1_ym, 1, -1, 4);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_ymb_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_ym2_thread(itask, dst, vcp2_ym);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // "Plus" kernel in the z direction: updates w from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_zp, let the master thread exchange it into vcp2_zp
 // (idir = 2, ipm = +1, tag 5), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_zp(Field& w, const Field& f)
 {
   double *src = const_cast<Field *>(&f)->ptr(0);
   double *dst = w.ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_zp1_thread(itask, vcp1_zp, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Nx * m_Ny * m_Nt;
     Communicator::exchange(n_face, vcp2_zp, vcp1_zp, 2, 1, 5);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_zpb_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_zp2_thread(itask, dst, vcp2_zp);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // "Minus" kernel in the z direction: updates w from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_zm, let the master thread exchange it into vcp2_zm
 // (idir = 2, ipm = -1, tag 6), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_zm(Field& w, const Field& f)
 {
   double *dst = w.ptr(0);
   double *src = const_cast<Field *>(&f)->ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_zm1_thread(itask, vcp1_zm, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Nx * m_Ny * m_Nt;
     Communicator::exchange(n_face, vcp2_zm, vcp1_zm, 2, -1, 6);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_zmb_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_zm2_thread(itask, dst, vcp2_zm);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // "Plus" kernel in the t direction, Dirac representation: updates w
 // from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_tp, let the master thread exchange it into vcp2_tp
 // (idir = 3, ipm = +1, tag 7), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_tp_dirac(Field& w, const Field& f)
 {
   double *src = const_cast<Field *>(&f)->ptr(0);
   double *dst = w.ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tp1_dirac_thread(itask, vcp1_tp, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Nx * m_Ny * m_Nz;
     Communicator::exchange(n_face, vcp2_tp, vcp1_tp, 3, 1, 7);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tpb_dirac_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tp2_dirac_thread(itask, dst, vcp2_tp);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // "Minus" kernel in the t direction, Dirac representation: updates w
 // from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_tm, let the master thread exchange it into vcp2_tm
 // (idir = 3, ipm = -1, tag 8), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_tm_dirac(Field& w, const Field& f)
 {
   double *dst = w.ptr(0);
   double *src = const_cast<Field *>(&f)->ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tm1_dirac_thread(itask, vcp1_tm, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Nx * m_Ny * m_Nz;
     Communicator::exchange(n_face, vcp2_tm, vcp1_tm, 3, -1, 8);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tmb_dirac_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tm2_dirac_thread(itask, dst, vcp2_tm);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // "Plus" kernel in the t direction, chiral representation: updates w
 // from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_tp, let the master thread exchange it into vcp2_tp
 // (idir = 3, ipm = +1, tag 7), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_tp_chiral(Field& w, const Field& f)
 {
   double *src = const_cast<Field *>(&f)->ptr(0);
   double *dst = w.ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tp1_chiral_thread(itask, vcp1_tp, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Nx * m_Ny * m_Nz;
     Communicator::exchange(n_face, vcp2_tp, vcp1_tp, 3, 1, 7);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tpb_chiral_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tp2_chiral_thread(itask, dst, vcp2_tp);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 // "Minus" kernel in the t direction, chiral representation: updates w
 // from f.
 //
 // Must be called by every thread of the team (it contains orphaned OpenMP
 // barriers and ends with sync_barrier_all). Sequence: fill the send
 // buffer vcp1_tm, let the master thread exchange it into vcp2_tm
 // (idir = 3, ipm = -1, tag 8), then apply the "b" and "2" kernels to w.
 // NOTE(review): w is not cleared here, so the kernels presumably add to
 // its current contents - confirm in the .inc implementation.
 void Fopr_Wilson::Fopr_Wilson_impl::mult_tm_chiral(Field& w, const Field& f)
 {
   double *dst = w.ptr(0);
   double *src = const_cast<Field *>(&f)->ptr(0);

   // Half-open range of tasks [task_begin, task_end) owned by this thread.
   const int n_threads  = ThreadManager_OpenMP::get_num_threads();
   const int thread_id  = ThreadManager_OpenMP::get_thread_id();
   const int task_begin = m_Ntask * thread_id / n_threads;
   const int task_end   = m_Ntask * (thread_id + 1) / n_threads;

 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tm1_chiral_thread(itask, vcp1_tm, src);
   }
 #pragma omp barrier

   // Communication is done by the master thread only.
 #pragma omp master
   {
     const int n_face = m_Nvc * 2 * m_Nx * m_Ny * m_Nz;
     Communicator::exchange(n_face, vcp2_tm, vcp1_tm, 3, -1, 8);
   }
 #pragma omp barrier

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tmb_chiral_thread(itask, dst, src);
   }

   for (int itask = task_begin; itask < task_end; ++itask) {
     mult_tm2_chiral_thread(itask, dst, vcp2_tm);
   }

   ThreadManager_OpenMP::sync_barrier_all();
 }


 //====================================================================

 //============================================================END=====

Fopr_Wilson::Fopr_Wilson_impl::daypx
void daypx(Field &, double, const Field &)
Definition: fopr_Wilson_impl.cpp:477

CommonParameters::Nd
static int Nd()
Definition: commonParameters.h:103

Fopr_Wilson::Fopr_Wilson_impl::vcp1_xm
double * vcp1_xm
Definition: fopr_Wilson_impl.h:68

CommonParameters::Nc
static int Nc()
Definition: commonParameters.h:102

Fopr_Wilson::Fopr_Wilson_impl::mult_zp
void mult_zp(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:697

Bridge::vout
BridgeIO vout
Definition: bridgeIO.cpp:207

threadManager_OpenMP.h

Fopr_Wilson::Fopr_Wilson_impl::vcp1_zp
double * vcp1_zp
Definition: fopr_Wilson_impl.h:70

ThreadManager_OpenMP::get_num_threads
static int get_num_threads()
returns available number of threads.
Definition: threadManager_OpenMP.cpp:95

Fopr_Wilson::Fopr_Wilson_impl::vcp2_yp
double * vcp2_yp
Definition: fopr_Wilson_impl.h:69

Fopr_Wilson::Fopr_Wilson_impl::set_parameters
void set_parameters(const double kappa, const std::valarray< int > bc)

Fopr_Wilson::Fopr_Wilson_impl::gm5_chiral
void gm5_chiral(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:531

Fopr_Wilson::Fopr_Wilson_impl::proj_chiral
void proj_chiral(Field &w, const int ex1, const Field &v, const int ex2, const int ipm)
Definition: fopr_Wilson_impl.cpp:456

CommonParameters::Ndim
static int Ndim()
Definition: commonParameters.h:104

Fopr_Wilson::Fopr_Wilson_impl::m_Nt
int m_Nt
Definition: fopr_Wilson_impl.h:49

Fopr_Wilson::Fopr_Wilson_impl::vcp1_xp
double * vcp1_xp
arrays for data transfer.
Definition: fopr_Wilson_impl.h:68

Fopr_Wilson::Fopr_Wilson_impl::mult_tm_dirac
void mult_tm_dirac(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:808

Fopr_Wilson::Fopr_Wilson_impl::vcp1_yp
double * vcp1_yp
Definition: fopr_Wilson_impl.h:69

Bridge::BridgeIO::general
void general(const char *format,...)
Definition: bridgeIO.cpp:38

GammaMatrixSet::get_GM
GammaMatrix get_GM(GMspecies spec)
Definition: gammaMatrixSet.h:69

Fopr_Wilson::Fopr_Wilson_impl::m_w1
Field m_w1
Definition: fopr_Wilson_impl.h:65

CommonParameters::Vlevel
static Bridge::VerboseLevel Vlevel()
Definition: commonParameters.h:109

Field::ptr
double * ptr(const int jin, const int site, const int jex)
Definition: field.h:118

Field
Container of Field-type object.
Definition: field.h:37

Fopr_Wilson::Fopr_Wilson_impl::m_D_ex
void(Fopr_Wilson::Fopr_Wilson_impl::* m_D_ex)(Field &, const int, const Field &, const int)
Definition: fopr_Wilson_impl.h:185

Fopr_Wilson::Fopr_Wilson_impl::D
void D(Field &v, const Field &f)
Definition: fopr_Wilson_impl.h:100

Fopr_Wilson::Fopr_Wilson_impl::vcp1_tp
double * vcp1_tp
Definition: fopr_Wilson_impl.h:71

GammaMatrixSet::GAMMA3
Definition: gammaMatrixSet.h:49

Fopr_Wilson::Fopr_Wilson_impl::vcp2_zm
double * vcp2_zm
Definition: fopr_Wilson_impl.h:70

Fopr_Wilson::Fopr_Wilson_impl::vcp2_tp
double * vcp2_tp
Definition: fopr_Wilson_impl.h:71

Fopr_Wilson::Fopr_Wilson_impl::m_mult_dag
void(Fopr_Wilson::Fopr_Wilson_impl::* m_mult_dag)(Field &, const Field &)
Definition: fopr_Wilson_impl.h:180

Fopr_Wilson::Fopr_Wilson_impl::vcp2_zp
double * vcp2_zp
Definition: fopr_Wilson_impl.h:70

GammaMatrixSet::GAMMA1
Definition: gammaMatrixSet.h:49

Fopr_Wilson::mult_up
void mult_up(int mu, Field &w, const Field &v)
adding the hopping to nearest neighbor site in mu-th direction.
Definition: fopr_Wilson.cpp:156

Fopr_Wilson::Fopr_Wilson_impl::mult_tp_chiral
void mult_tp_chiral(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:845

Fopr_Wilson::Fopr_Wilson_impl::m_Nvol
int m_Nvol
Definition: fopr_Wilson_impl.h:50

CommonParameters::Nz
static int Nz()
Definition: commonParameters.h:98

Communicator::ipe
static int ipe(const int dir)
logical coordinate of current proc.
Definition: communicator.cpp:104

Fopr_Wilson::Fopr_Wilson_impl::H
void H(Field &w, const Field &f)
Definition: fopr_Wilson_impl.h:130

CommonParameters::Lvol
static int Lvol()
Definition: commonParameters.h:86

Fopr_Wilson::Fopr_Wilson_impl::m_boundary2
std::valarray< double > m_boundary2
b.c. for each node.
Definition: fopr_Wilson_impl.h:55

Fopr_Wilson::Fopr_Wilson_impl::m_Ndf
int m_Ndf
Definition: fopr_Wilson_impl.h:48

Fopr_Wilson::Fopr_Wilson_impl::D_chiral
void D_chiral(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:244

CommonParameters::Nx
static int Nx()
Definition: commonParameters.h:96

Fopr_Wilson::Fopr_Wilson_impl::vcp2_xp
double * vcp2_xp
Definition: fopr_Wilson_impl.h:68

Fopr_Wilson::Fopr_Wilson_impl::m_Nd
int m_Nd
Definition: fopr_Wilson_impl.h:48

Fopr_Wilson::Fopr_Wilson_impl::m_Ny
int m_Ny
Definition: fopr_Wilson_impl.h:49

ThreadManager_OpenMP::get_thread_id
static int get_thread_id()
returns thread id.
Definition: threadManager_OpenMP.cpp:107

Fopr_Wilson::Fopr_Wilson_impl::mult_xm
void mult_xm(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:586

Fopr_Wilson::Fopr_Wilson_impl::vcp1_tm
double * vcp1_tm
Definition: fopr_Wilson_impl.h:71

Fopr_Wilson::Fopr_Wilson_impl::vcp2_tm
double * vcp2_tm
Definition: fopr_Wilson_impl.h:71

Fopr_Wilson::Fopr_Wilson_impl::tidyup
void tidyup()
Definition: fopr_Wilson_impl.cpp:153

Fopr_Wilson::Fopr_Wilson_impl::m_Nx
int m_Nx
Definition: fopr_Wilson_impl.h:49

Fopr_Wilson::Fopr_Wilson_impl::DdagD
void DdagD(Field &w, const Field &f)
Definition: fopr_Wilson_impl.h:110

Fopr_Wilson::Fopr_Wilson_impl::m_U
const Field_G * m_U
gauge configuration.
Definition: fopr_Wilson_impl.h:57

Fopr_Wilson::Fopr_Wilson_impl::m_w2
Field m_w2
temporary fields.
Definition: fopr_Wilson_impl.h:65

CommonParameters::Nvol
static int Nvol()
Definition: commonParameters.h:100

Fopr_Wilson::Fopr_Wilson_impl::vcp1_zm
double * vcp1_zm
Definition: fopr_Wilson_impl.h:70

Fopr_Wilson::Fopr_Wilson_impl::clear
void clear(Field &)
Definition: fopr_Wilson_impl.cpp:496

Fopr_Wilson::Fopr_Wilson_impl::get_mode
std::string get_mode() const
Definition: fopr_Wilson_impl.cpp:177

Fopr_Wilson::Fopr_Wilson_impl::m_mult
void(Fopr_Wilson::Fopr_Wilson_impl::* m_mult)(Field &, const Field &)
Definition: fopr_Wilson_impl.h:179

Fopr_Wilson::Fopr_Wilson_impl::m_repr
std::string m_repr
Definition: fopr_Wilson_impl.h:63

Fopr_Wilson::Fopr_Wilson_impl::DDdag
void DDdag(Field &w, const Field &f)
Definition: fopr_Wilson_impl.h:120

Fopr::m_vl
Bridge::VerboseLevel m_vl
Definition: fopr.h:99

Fopr_Wilson::Fopr_Wilson_impl::vcp2_xm
double * vcp2_xm
Definition: fopr_Wilson_impl.h:68

Field::reset
void reset(const int Nin, const int Nvol, const int Nex, const element_type cmpl=COMPLEX)
Definition: field.h:82

Fopr_Wilson::Fopr_Wilson_impl::m_vl
Bridge::VerboseLevel m_vl
Definition: fopr_Wilson_impl.h:60

Fopr_Wilson::Fopr_Wilson_impl::m_GM
std::valarray< GammaMatrix > m_GM
gamma matrices.
Definition: fopr_Wilson_impl.h:58

ThreadManager_OpenMP::sync_barrier_all
static void sync_barrier_all()
barrier among all the threads and nodes.
Definition: threadManager_OpenMP.cpp:141

Fopr_Wilson::Fopr_Wilson_impl::mult_ym
void mult_ym(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:660

GammaMatrixSet::GAMMA4
Definition: gammaMatrixSet.h:49

Fopr_Wilson::Fopr_Wilson_impl::m_D
void(Fopr_Wilson::Fopr_Wilson_impl::* m_D)(Field &, const Field &)
Definition: fopr_Wilson_impl.h:181

Communicator::exchange
static int exchange(int count, double *recv_buf, double *send_buf, int idir, int ipm, int tag)
Receives an array of doubles from upstream, as specified by idir and ipm, and sends an array to downstream...
Definition: communicator.cpp:183

GammaMatrixSet
Set of Gamma Matrices: basis class.
Definition: gammaMatrixSet.h:38

Fopr_Wilson::class_name
static const std::string class_name
Definition: fopr_Wilson.h:56

Fopr_Wilson::Fopr_Wilson_impl::m_gm5
void(Fopr_Wilson::Fopr_Wilson_impl::* m_gm5)(Field &, const Field &)
Definition: fopr_Wilson_impl.h:182

CommonParameters::Nt
static int Nt()
Definition: commonParameters.h:99

Fopr_Wilson::Fopr_Wilson_impl::D_ex_chiral
void D_ex_chiral(Field &, const int ex1, const Field &, const int ex2)
Definition: fopr_Wilson_impl.cpp:360

Fopr_Wilson::Fopr_Wilson_impl::D_ex_dirac
void D_ex_dirac(Field &, const int ex1, const Field &, const int ex2)
Definition: fopr_Wilson_impl.cpp:287

Fopr_Wilson::Fopr_Wilson_impl::class_name
static const std::string class_name
Definition: fopr_Wilson_impl.h:44

Fopr_Wilson::Fopr_Wilson_impl::mult_gm5p
const Field_F mult_gm5p(int mu, const Field_F &w)
Definition: fopr_Wilson_impl.h:146

Fopr_Wilson::Fopr_Wilson_impl::flop_count
double flop_count()
Definition: fopr_Wilson_impl.cpp:209

Bridge::BridgeIO::crucial
void crucial(const char *format,...)
Definition: bridgeIO.cpp:26

Fopr_Wilson::Fopr_Wilson_impl::vcp2_ym
double * vcp2_ym
Definition: fopr_Wilson_impl.h:69

Fopr_Wilson::Fopr_Wilson_impl::set_mode
void set_mode(std::string mode)
Definition: fopr_Wilson_impl.cpp:126

Fopr_Wilson::Fopr_Wilson_impl::vcp1_ym
double * vcp1_ym
Definition: fopr_Wilson_impl.h:69

Fopr_Wilson::Fopr_Wilson_impl::m_Nc
int m_Nc
Definition: fopr_Wilson_impl.h:48

Fopr_Wilson::Fopr_Wilson_impl::m_mult_tm
void(Fopr_Wilson::Fopr_Wilson_impl::* m_mult_tm)(Field &, const Field &)
Definition: fopr_Wilson_impl.h:184

CommonParameters::Ny
static int Ny()
Definition: commonParameters.h:97

Fopr_Wilson::Fopr_Wilson_impl::mult_tp_dirac
void mult_tp_dirac(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:771

Fopr_Wilson::Fopr_Wilson_impl::m_boundary
std::valarray< int > m_boundary
boundary condition.
Definition: fopr_Wilson_impl.h:54

Fopr_Wilson::Fopr_Wilson_impl::mult_up
void mult_up(int mu, Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:250

Fopr_Wilson::Fopr_Wilson_impl::D_dirac
void D_dirac(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:238

Fopr_Wilson::Fopr_Wilson_impl::mult_zm
void mult_zm(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:734

Fopr_Wilson::Fopr_Wilson_impl::mult_undef
void mult_undef(Field &, const Field &f)
Definition: fopr_Wilson_impl.h:136

Fopr_Wilson::Fopr_Wilson_impl::m_Nz
int m_Nz
Definition: fopr_Wilson_impl.h:49

Fopr_Wilson::Fopr_Wilson_impl::mult_yp
void mult_yp(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:623

Field::setpart_ex
void setpart_ex(int ex, const Field &w, int exw)
Definition: field.h:150

Fopr_Wilson::Fopr_Wilson_impl::m_Ndim
int m_Ndim
Definition: fopr_Wilson_impl.h:50

Fopr_Wilson::Fopr_Wilson_impl::setup_thread
void setup_thread()
Definition: fopr_Wilson_impl_thread.cpp:35

Fopr_Wilson::Fopr_Wilson_impl::mult_xp
void mult_xp(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:549

Fopr_Wilson::Fopr_Wilson_impl::mult_dn
void mult_dn(int mu, Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:269

Fopr_Wilson::Fopr_Wilson_impl::Ddag
void Ddag(Field &w, const Field &f)
Definition: fopr_Wilson_impl.h:103

fopr_Wilson_impl.h

Fopr_Wilson::Fopr_Wilson_impl::init
void init(std::string repr)

Fopr_Wilson::Fopr_Wilson_impl::m_Nvc
int m_Nvc
Definition: fopr_Wilson_impl.h:48

Fopr_Wilson::Fopr_Wilson_impl::m_mult_tp
void(Fopr_Wilson::Fopr_Wilson_impl::* m_mult_tp)(Field &, const Field &)
Definition: fopr_Wilson_impl.h:183

Fopr_Wilson::mult_gm5
const Field mult_gm5(const Field &f)
Definition: fopr_Wilson.h:91

GammaMatrixSet::GAMMA5
Definition: gammaMatrixSet.h:50

Fopr_Wilson::Fopr_Wilson_impl::mult_tm_chiral
void mult_tm_chiral(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:882

Fopr_Wilson::Fopr_Wilson_impl::gm5_dirac
void gm5_dirac(Field &, const Field &)
Definition: fopr_Wilson_impl.cpp:513

GammaMatrixSet::GAMMA2
Definition: gammaMatrixSet.h:49