16 #ifdef USE_FACTORY_AUTOREGISTER
18 bool init = Solver_BiCGStab_DS_L_Cmplx::register_factory();
27 const string str_vlevel = params.
get_string(
"verbose_level");
36 double Omega_tolerance;
40 err += params.
fetch_int(
"maximum_number_of_iteration", Niter);
41 err += params.
fetch_int(
"maximum_number_of_restart", Nrestart);
42 err += params.
fetch_double(
"convergence_criterion_squared", Stop_cond);
43 err += params.
fetch_bool(
"use_initial_guess", use_init_guess);
44 err += params.
fetch_double(
"Omega_tolerance", Omega_tolerance);
45 err += params.
fetch_int(
"number_of_orthonormal_vectors", N_L);
46 err += params.
fetch_double(
"tolerance_for_DynamicSelection_of_L", Tol_L);
99 vout.
general(
m_vl,
" use_init_guess = %s\n", use_init_guess ?
"true" :
"false");
161 int& Nconv,
double& diff)
163 const double bnorm2 = b.
norm2();
164 const int bsize = b.
size();
170 bool is_converged =
false;
188 Nconv2 += Nconv_unit;
193 for (
int i_restart = 0; i_restart <
m_Nrestart; i_restart++) {
194 for (
int iter = 0; iter <
m_Niter; iter++) {
231 vout.
crucial(
m_vl,
" iter(final): %8d %22.15e\n", Nconv2, diff2 / bnorm2);
241 diff = sqrt(diff2 / bnorm2);
254 const int Nin = b.
nin();
255 const int Nvol = b.
nvol();
256 const int Nex = b.
nex();
268 for (
int i = 0; i <
m_N_L + 1; ++i) {
269 m_u[i].reset(Nin, Nvol, Nex);
270 m_r[i].reset(Nin, Nvol, Nex);
284 for (
int i = 0; i <
m_N_L + 1; ++i) {
318 dcomplex c_Rayleigh_prev = cmplx(0.0, 0.0);
320 bool is_converged_L =
false;
324 if (!is_converged_L) {
328 dcomplex beta = alpha_prev2 * (rho / rho_prev2);
332 for (
int i = 0; i < j + 1; ++i) {
339 alpha_prev2 = rho_prev2 / conj(gamma);
341 for (
int i = 0; i < j + 1; ++i) {
353 double r_tmp =
m_r[j].norm2();
354 dcomplex c_Rayleigh =
dotc(
m_r[j],
m_r[j + 1]) / r_tmp;
356 dcomplex c_E = (c_Rayleigh - c_Rayleigh_prev) / c_Rayleigh;
358 c_Rayleigh_prev = c_Rayleigh;
368 is_converged_L =
true;
374 std::vector<double> sigma(
m_N_L + 1);
375 std::vector<dcomplex> gamma_prime(
m_N_L + 1);
378 std::vector<dcomplex> tau(
m_N_L * (
m_N_L + 1));
380 const double sigma_0 =
m_r[0].norm2();
382 for (
int j = 1; j < N_L_tmp + 1; ++j) {
383 for (
int i = 1; i < j; ++i) {
387 tau[ij] = conj(r_ji) / sigma[i];
391 sigma[j] =
m_r[j].norm2();
394 gamma_prime[j] = conj(r_0j) / sigma[j];
397 double abs_rho = abs(r_0j) / sqrt(sigma[j] * sigma_0);
404 std::vector<dcomplex> gamma(
m_N_L + 1);
405 gamma[N_L_tmp] = gamma_prime[N_L_tmp];
407 for (
int j = N_L_tmp - 1; j > 0; --j) {
408 dcomplex c_tmp = cmplx(0.0, 0.0);
410 for (
int i = j + 1; i < N_L_tmp + 1; ++i) {
412 c_tmp += tau[ji] * gamma[i];
415 gamma[j] = gamma_prime[j] - c_tmp;
420 std::vector<dcomplex> gamma_double_prime(
m_N_L);
422 for (
int j = 1; j < N_L_tmp; ++j) {
423 dcomplex c_tmp = cmplx(0.0, 0.0);
425 for (
int i = j + 1; i < N_L_tmp; ++i) {
427 c_tmp += tau[ji] * gamma[i + 1];
430 gamma_double_prime[j] = gamma[j + 1] + c_tmp;
435 axpy(
m_r[0], -gamma_prime[N_L_tmp],
m_r[N_L_tmp]);
438 for (
int j = 1; j < N_L_tmp; ++j) {
452 m_N_L_prev = N_L_tmp;
467 const int Nin =
m_x.
nin();
469 const int Nex =
m_x.
nex();
478 const double gflop_axpy = (Nin * Nex * 2) * ((Nvol * NPE) / 1.0e+9);
479 const double gflop_dotc = (Nin * Nex * 4) * ((Nvol * NPE) / 1.0e+9);
480 const double gflop_norm = (Nin * Nex * 2) * ((Nvol * NPE) / 1.0e+9);
484 const double gflop_init = gflop_fopr + gflop_axpy + gflop_norm;
485 const double gflop_step_BiCG_part = 2 * N_L_prev_total * gflop_fopr
486 + 3 * N_L_prev_total * gflop_dotc
488 + N_L_prev_total * gflop_norm;
489 const double gflop_step_L_part = (
m_N_L_part_count + N_L_prev_total) * gflop_dotc
492 const double gflop_step = gflop_step_BiCG_part + gflop_step_L_part;
493 const double gflop_true_residual = gflop_fopr + gflop_axpy + gflop_norm;
495 const double gflop = gflop_norm + gflop_init + gflop_step + gflop_true_residual * (
m_Nrestart_count + 1)
void set_parameters_DS_L(const int N_L, const double Tol_L)
int fetch_bool(const string &key, bool &value) const
void detailed(const char *format,...)
static double epsilon_criterion()
void solve_init(const Field &, double &)
void general(const char *format,...)
void reset_field(const Field &)
Container of Field-type object.
int fetch_double(const string &key, double &value) const
void set_parameters_BiCGStab_series(const double Omega_tolerance)
void copy(Field &y, const Field &x)
copy(y, x): y = x
void solve(Field &solution, const Field &source, int &Nconv, double &diff)
int square_non_zero(const double v)
dcomplex dotc(const Field &y, const Field &x)
int fetch_int(const string &key, int &value) const
virtual double flop_count()
returns the flop count in giga units (GFlop)
void aypx(const double a, Field &y, const Field &x)
aypx(a, y, x): y := a * y + x
void solve_step(double &)
void paranoiac(const char *format,...)
void reset(const int Nin, const int Nvol, const int Nex, const element_type cmpl=Element_type::COMPLEX)
void axpy(Field &y, const double a, const Field &x)
axpy(y, a, x): y := a * x + y
void crucial(const char *format,...)
static const std::string class_name
virtual void mult(Field &, const Field &)=0
multiplies fermion operator to a given field (2nd argument)
int non_negative(const int v)
int index_ij(const int i, const int j)
void set_parameters(const Parameters &params)
static void assert_single_thread(const std::string &class_name)
assert currently running on single thread.
string get_string(const string &key) const
Bridge::VerboseLevel m_vl
static VerboseLevel set_verbose_level(const std::string &str)