Flow123d  release_3.0.0-506-g34af125
linsys_PETSC.cc
Go to the documentation of this file.
1 /*!
2  *
3  * Copyright (C) 2015 Technical University of Liberec. All rights reserved.
4  *
5  * This program is free software; you can redistribute it and/or modify it under
6  * the terms of the GNU General Public License version 3 as published by the
7  * Free Software Foundation. (http://www.gnu.org/licenses/gpl-3.0.en.html)
8  *
9  * This program is distributed in the hope that it will be useful, but WITHOUT
10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
11  * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
12  *
13  *
14  * @file linsys_PETSC.cc
15  * @brief Solver based on the original PETSc solver using MPIAIJ matrix and succesive Schur complement construction
16  * @author Jakub Sistek
17  */
18 
19 // derived from base linsys
20 #include "la/linsys_PETSC.hh"
21 #include "petscvec.h"
22 #include "petscksp.h"
23 #include "petscmat.h"
24 #include "system/sys_profiler.hh"
25 #include "system/system.hh"
26 
27 
28 //#include <boost/bind.hpp>
29 
30 namespace it = Input::Type;
31 
33  return it::Record("Petsc", "Interface to PETSc solvers. Convergence criteria is:\n"
34  "```\n"
35  "norm( res_n ) < max( norm( res_0 ) * r_tol, a_tol )\n"
36  "```\n"
37  "where res_i is the residuum vector after i-th iteration of the solver and res_0 is an estimate of the norm of initial residual. "
38  "If the initial guess of the solution is provided (usually only for transient equations) the residual of this estimate is used, "
39  "otherwise the norm of preconditioned RHS is used. "
40  "The default norm is L2 norm of preconditioned residual: (($ P^{-1}(Ax-b)$)), usage of other norm may be prescribed using the 'option' key. "
41  "See also PETSc documentation for KSPSetNormType.")
43  .declare_key("r_tol", it::Double(0.0, 1.0), it::Default::read_time("Defalut value set by nonlinear solver or equation. If not we use value 1.0e-7."),
44  "Relative residual tolerance, (to initial error).")
45  .declare_key("a_tol", it::Double(0.0), it::Default::read_time("Defalut value set by nonlinear solver or equation. If not we use value 1.0e-11."),
46  "Absolute residual tolerance.")
47  .declare_key("max_it", it::Integer(0), it::Default::read_time("Defalut value set by nonlinear solver or equation. If not we use value 1000."),
48  "Maximum number of outer iterations of the linear solver.")
49  .declare_key("options", it::String(), it::Default("\"\""), "Options passed to PETSC before creating KSP instead of default setting.")
50  .close();
51 }
52 
53 
55 
56 
57 LinSys_PETSC::LinSys_PETSC( const Distribution * rows_ds, const std::string &params)
58  : LinSys( rows_ds ),
59  params_(params),
60  init_guess_nonzero(false),
61  matrix_(0)
62 {
63  // create PETSC vectors:
64  PetscErrorCode ierr;
65  // rhs
66  v_rhs_= new double[ rows_ds_->lsize() + 1 ];
67  ierr = VecCreateMPIWithArray( comm_, 1, rows_ds_->lsize(), PETSC_DECIDE, v_rhs_, &rhs_ ); CHKERRV( ierr );
68  ierr = VecZeroEntries( rhs_ ); CHKERRV( ierr );
69  VecDuplicate(rhs_, &residual_);
70 
71  matrix_ = NULL;
72  solution_precision_ = std::numeric_limits<double>::infinity();
73  matrix_changed_ = true;
74  rhs_changed_ = true;
75 }
76 
78  : LinSys(other), params_(other.params_), v_rhs_(NULL), solution_precision_(other.solution_precision_)
79 {
80  MatCopy(other.matrix_, matrix_, DIFFERENT_NONZERO_PATTERN);
81  VecCopy(other.rhs_, rhs_);
82  VecCopy(other.on_vec_, on_vec_);
83  VecCopy(other.off_vec_, off_vec_);
84 }
85 
86 void LinSys_PETSC::set_tolerances(double r_tol, double a_tol, unsigned int max_it)
87 {
88  if (! in_rec_.is_empty()) {
89  // input record is set
90  r_tol_ = in_rec_.val<double>("r_tol", r_tol);
91  a_tol_ = in_rec_.val<double>("a_tol", a_tol);
92  max_it_ = in_rec_.val<unsigned int>("max_it", max_it);
93  } else {
94  r_tol_ = r_tol;
95  a_tol_ = a_tol;
96  max_it_ = max_it;
97 
98  }
99 }
100 
101 
103 {
104  PetscErrorCode ierr;
105 
106  ierr = VecCreateMPI( comm_, rows_ds_->lsize(), PETSC_DECIDE, &(on_vec_) ); CHKERRV( ierr );
107  ierr = VecDuplicate( on_vec_, &(off_vec_) ); CHKERRV( ierr );
108  status_ = ALLOCATE;
109 }
110 
112 {
113  switch ( status_ ) {
114  case ALLOCATE:
115  this->preallocate_matrix( );
116  break;
117  case INSERT:
118  this->finish_assembly( MAT_FLUSH_ASSEMBLY );
119  break;
120  case ADD:
121  case DONE:
122  break;
123  default:
124  OLD_ASSERT( false, "Can not set values. Matrix is not preallocated.\n");
125  }
126  status_ = ADD;
127 }
128 
130 {
131  switch ( status_ ) {
132  case ALLOCATE:
133  this->preallocate_matrix();
134  break;
135  case ADD:
136  this->finish_assembly( MAT_FLUSH_ASSEMBLY );
137  break;
138  case INSERT:
139  case DONE:
140  break;
141  default:
142  OLD_ASSERT( false, "Can not set values. Matrix is not preallocated.\n");
143  }
144  status_ = INSERT;
145 }
146 
147 void LinSys_PETSC::mat_set_values( int nrow, int *rows, int ncol, int *cols, double *vals )
148 {
149  // here vals would need to be converted from double to PetscScalar if it was ever something else than double :-)
150  switch (status_) {
151  case INSERT:
152  case ADD:
153  chkerr(MatSetValues(matrix_,nrow,rows,ncol,cols,vals,(InsertMode)status_));
154  break;
155  case ALLOCATE:
156  this->preallocate_values(nrow,rows,ncol,cols);
157  break;
158  default: DebugOut() << "LS SetValues with non allowed insert mode.\n";
159  }
160 
161  matrix_changed_ = true;
162 }
163 
164 void LinSys_PETSC::rhs_set_values( int nrow, int *rows, double *vals )
165 {
166  PetscErrorCode ierr;
167 
168  switch (status_) {
169  case INSERT:
170  case ADD:
171  ierr = VecSetValues(rhs_,nrow,rows,vals,(InsertMode)status_); CHKERRV( ierr );
172  break;
173  case ALLOCATE:
174  break;
175  default: OLD_ASSERT(false, "LinSys's status disallow set values.\n");
176  }
177 
178  rhs_changed_ = true;
179 }
180 
181 void LinSys_PETSC::preallocate_values(int nrow,int *rows,int ncol,int *cols)
182 {
183  int i,j;
184  int col;
185  PetscInt row;
186 
187  for (i=0; i<nrow; i++) {
188  row=rows[i];
189  for(j=0; j<ncol; j++) {
190  col = cols[j];
191  if (rows_ds_->get_proc(row) == rows_ds_->get_proc(col))
192  VecSetValue(on_vec_,row,1.0,ADD_VALUES);
193  else
194  VecSetValue(off_vec_,row,1.0,ADD_VALUES);
195  }
196  }
197 }
198 
200 {
201  OLD_ASSERT(status_ == ALLOCATE, "Linear system has to be in ALLOCATE status.");
202 
203  PetscErrorCode ierr;
204  PetscInt *on_nz, *off_nz;
205  PetscScalar *on_array, *off_array;
206 
207  // assembly and get values from counting vectors, destroy them
208  VecAssemblyBegin(on_vec_);
209  VecAssemblyBegin(off_vec_);
210 
211  on_nz = new PetscInt[ rows_ds_->lsize() ];
212  off_nz = new PetscInt[ rows_ds_->lsize() ];
213 
214  VecAssemblyEnd(on_vec_);
215  VecAssemblyEnd(off_vec_);
216 
217  VecGetArray( on_vec_, &on_array );
218  VecGetArray( off_vec_, &off_array );
219 
220  for ( unsigned int i=0; i<rows_ds_->lsize(); i++ ) {
221  on_nz[i] = std::min( rows_ds_->lsize(), static_cast<uint>( on_array[i]+0.1 ) ); // small fraction to ensure correct rounding
222  off_nz[i] = std::min( rows_ds_->size() - rows_ds_->lsize(), static_cast<uint>( off_array[i]+0.1 ) );
223  }
224 
225  VecRestoreArray(on_vec_,&on_array);
226  VecRestoreArray(off_vec_,&off_array);
227  VecDestroy(&on_vec_);
228  VecDestroy(&off_vec_);
229 
230  // create PETSC matrix with preallocation
231  if (matrix_ != NULL)
232  {
233  chkerr(MatDestroy(&matrix_));
234  }
235  ierr = MatCreateAIJ(PETSC_COMM_WORLD, rows_ds_->lsize(), rows_ds_->lsize(), PETSC_DETERMINE, PETSC_DETERMINE,
236  0, on_nz, 0, off_nz, &matrix_); CHKERRV( ierr );
237 
238  if (symmetric_) MatSetOption(matrix_, MAT_SYMMETRIC, PETSC_TRUE);
239  MatSetOption(matrix_, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE);
240  MatSetOption(matrix_, MAT_IGNORE_ZERO_ENTRIES, PETSC_TRUE);
241 
242  delete[] on_nz;
243  delete[] off_nz;
244 }
245 
247 {
248  MatAssemblyType assemblyType = MAT_FINAL_ASSEMBLY;
249  this->finish_assembly( assemblyType );
250 }
251 
252 void LinSys_PETSC::finish_assembly( MatAssemblyType assembly_type )
253 {
254  PetscErrorCode ierr;
255 
256  if (status_ == ALLOCATE) {
257  WarningOut() << "Finalizing linear system without setting values.\n";
258  this->preallocate_matrix();
259  }
260  ierr = MatAssemblyBegin(matrix_, assembly_type); CHKERRV( ierr );
261  ierr = VecAssemblyBegin(rhs_); CHKERRV( ierr );
262  ierr = MatAssemblyEnd(matrix_, assembly_type); CHKERRV( ierr );
263  ierr = VecAssemblyEnd(rhs_); CHKERRV( ierr );
264 
265  if (assembly_type == MAT_FINAL_ASSEMBLY) status_ = DONE;
266 
267  //PetscViewerPushFormat(PETSC_VIEWER_STDOUT_SELF, PETSC_VIEWER_ASCII_INDEX);
268  //MatView(matrix_, PETSC_VIEWER_STDOUT_SELF);
269  //VecView(rhs_, PETSC_VIEWER_STDOUT_SELF);
270  //this->view();
271 
272  matrix_changed_ = true;
273  rhs_changed_ = true;
274 }
275 
276 void LinSys_PETSC::apply_constrains( double scalar )
277 {
278  PetscErrorCode ierr;
279 
280  // check that system matrix is assembled
281  OLD_ASSERT ( status_ == DONE, "System matrix and right-hand side are not assembled when applying constraints." );
282 
283  // number of constraints
284  PetscInt numConstraints = static_cast<PetscInt>( constraints_.size() );
285 
286  // Additional multiplier for numerical reasons (criterion to be established)
287  const PetscScalar diagScalar = static_cast<PetscScalar>( scalar );
288 
289  std::vector<PetscInt> globalDofs;
291 
292  // Constraint iterators
293  ConstraintVec_::const_iterator cIter = constraints_.begin( );
294  ConstraintVec_::const_iterator cEnd = constraints_.end( );
295  // collect global dof indices and the correpsonding values
296  for ( ; cIter != cEnd; ++cIter ) {
297  globalDofs.push_back( static_cast<PetscInt>( cIter -> first ) );
298  values.push_back( static_cast<PetscScalar>( cIter -> second ) * diagScalar );
299  }
300 
301  // prepare pointers to be passed to PETSc
302  PetscInt * globalDofPtr = this->makePetscPointer_( globalDofs );
303  PetscScalar * valuePtr = this->makePetscPointer_( values );
304 
305  // set matrix rows to zero
306  ierr = MatZeroRows( matrix_, numConstraints, globalDofPtr, diagScalar, PETSC_NULL, PETSC_NULL ); CHKERRV( ierr );
307  matrix_changed_ = true;
308 
309  // set RHS entries to values (crashes if called with NULL pointers)
310  if ( numConstraints ) {
311  ierr = VecSetValues( rhs_, numConstraints, globalDofPtr, valuePtr, INSERT_VALUES ); CHKERRV( ierr );
312  rhs_changed_ = true;
313  }
314 
315  // perform communication in the rhs vector
316  ierr = VecAssemblyBegin( rhs_ ); CHKERRV( ierr );
317  ierr = VecAssemblyEnd( rhs_ ); CHKERRV( ierr );
318 }
319 
320 
322 {
323  init_guess_nonzero = set_nonzero;
324 }
325 
326 
328 {
329 
330  const char *petsc_dflt_opt;
331  int nits;
332 
333  // -mat_no_inode ... inodes are usefull only for
334  // vector problems e.g. MH without Schur complement reduction
335 
336  /* Comment to PETSc options:
337  *
338  * -ksp_diagonal_scale scales the matrix before solution, while -ksp_diagonal_scale_fix just fixes the scaling after solution
339  * -pc_asm_type basic enforces classical Schwartz method, which seems more stable for positive definite systems.
340  * The default 'restricted' probably violates s.p.d. structure, many tests fail.
341  */
342  if (rows_ds_->np() > 1) {
343  // parallel setting
344  if (this->is_positive_definite())
345  petsc_dflt_opt="-ksp_type cg -ksp_diagonal_scale -ksp_diagonal_scale_fix -pc_type asm -pc_asm_type basic -pc_asm_overlap 4 -sub_pc_type icc -sub_pc_factor_levels 3 -sub_pc_factor_fill 6.0";
346  //petsc_dflt_opt="-ksp_type bcgs -ksp_diagonal_scale_fix -pc_type asm -pc_asm_overlap 4 -sub_pc_type ilu -sub_pc_factor_levels 3 -sub_pc_factor_fill 6.0";
347  else
348  petsc_dflt_opt="-ksp_type bcgs -ksp_diagonal_scale -ksp_diagonal_scale_fix -pc_type asm -pc_asm_overlap 4 -sub_pc_type ilu -sub_pc_factor_levels 3 -sub_pc_factor_fill 6.0";
349 
350  }
351  else {
352  // serial setting
353  if (this->is_positive_definite())
354  petsc_dflt_opt="-ksp_type cg -pc_type icc -pc_factor_levels 3 -ksp_diagonal_scale -ksp_diagonal_scale_fix -pc_factor_fill 6.0";
355  //petsc_dflt_opt="-ksp_type bcgs -pc_type ilu -pc_factor_levels 5 -ksp_diagonal_scale_fix -pc_factor_fill 6.0";
356  else
357  petsc_dflt_opt="-ksp_type bcgs -pc_type ilu -pc_factor_levels 5 -ksp_diagonal_scale -ksp_diagonal_scale_fix -pc_factor_fill 6.0";
358  }
359 
360  if (params_ == "") params_ = petsc_dflt_opt;
361  LogOut().fmt("inserting petsc options: {}\n",params_.c_str());
362 
363  // now takes an optional PetscOptions object as the first argument
364  // value NULL will preserve previous behaviour previous behavior.
365  PetscOptionsInsertString(NULL, params_.c_str()); // overwrites previous options values
366 
367  MatSetOption( matrix_, MAT_USE_INODES, PETSC_FALSE );
368 
369  chkerr(KSPCreate( comm_, &system ));
370  chkerr(KSPSetOperators(system, matrix_, matrix_));
371 
372 
373  // TODO take care of tolerances - shall we support both input file and command line petsc setting
374  chkerr(KSPSetTolerances(system, r_tol_, a_tol_, PETSC_DEFAULT,PETSC_DEFAULT));
375  chkerr(KSPSetTolerances(system, r_tol_, a_tol_, PETSC_DEFAULT, max_it_));
376  KSPSetFromOptions(system);
377  // We set the KSP flag set_initial_guess_nonzero
378  // unless KSP type is preonly.
379  // In such case PETSc fails (version 3.4.1)
380  if (init_guess_nonzero)
381  {
382  KSPType type;
383  KSPGetType(system, &type);
384  if (strcmp(type, KSPPREONLY) != 0)
385  KSPSetInitialGuessNonzero(system, PETSC_TRUE);
386  }
387 
388  {
389  START_TIMER("PETSC linear solver");
390  START_TIMER("PETSC linear iteration");
391  chkerr(KSPSolve(system, rhs_, solution_ ));
392  KSPGetConvergedReason(system,&reason);
393  KSPGetIterationNumber(system,&nits);
394  ADD_CALLS(nits);
395  }
396  // substitute by PETSc call for residual
397  VecNorm(rhs_, NORM_2, &residual_norm_);
398 
399  LogOut().fmt("convergence reason {}, number of iterations is {}\n", reason, nits);
400 
401  // get residual norm
402  KSPGetResidualNorm(system, &solution_precision_);
403 
404  // TODO: I do not understand this
405  //Profiler::instance()->set_timer_subframes("SOLVING MH SYSTEM", nits);
406 
407  chkerr(KSPDestroy(&system));
408 
409  return LinSys::SolveInfo(static_cast<int>(reason), static_cast<int>(nits));
410 
411 }
412 
414 {
415  std::string matFileName = "flow123d_matrix.m";
416  std::string rhsFileName = "flow123d_rhs.m";
417  std::string solFileName = "flow123d_sol.m";
418 
419  PetscViewer myViewer;
420 
421  PetscViewerASCIIOpen(comm_,matFileName.c_str(),&myViewer);
422  PetscViewerSetFormat(myViewer,PETSC_VIEWER_ASCII_MATLAB);
423  MatView( matrix_, myViewer );
424  PetscViewerDestroy(&myViewer);
425 
426  PetscViewerASCIIOpen(comm_,rhsFileName.c_str(),&myViewer);
427  PetscViewerSetFormat(myViewer,PETSC_VIEWER_ASCII_MATLAB);
428  VecView( rhs_, myViewer );
429  PetscViewerDestroy(&myViewer);
430 
431  if ( solution_ != NULL ) {
432  PetscViewerASCIIOpen(comm_,solFileName.c_str(),&myViewer);
433  PetscViewerSetFormat(myViewer,PETSC_VIEWER_ASCII_MATLAB);
434  VecView( solution_, myViewer );
435  PetscViewerDestroy(&myViewer);
436  }
437 }
438 
440 {
441  if (matrix_ != NULL) { chkerr(MatDestroy(&matrix_)); }
442  chkerr(VecDestroy(&rhs_));
443 
444  if (residual_ != NULL) chkerr(VecDestroy(&residual_));
445  if (v_rhs_ != NULL) delete[] v_rhs_;
446 }
447 
448 
449 
451 {
452  LinSys::set_from_input( in_rec );
453 
454  // PETSC specific parameters
455  // If parameters are specified in input file, they are used,
456  // otherwise keep settings provided in constructor of LinSys_PETSC.
457  std::string user_params = in_rec.val<string>("options");
458  if (user_params != "") params_ = user_params;
459 }
460 
461 
463 {
464  return solution_precision_;
465 }
466 
467 
469 {
470  MatMult(matrix_, solution_, residual_);
471  VecAXPY(residual_,-1.0, rhs_);
472  double residual_norm;
473  VecNorm(residual_, NORM_2, &residual_norm);
474  return residual_norm;
475 }
unsigned int size() const
get global size
unsigned int get_proc(unsigned int idx) const
get processor of the given index
SetValuesMode status_
Set value status of the linear system.
Definition: linsys.hh:630
void apply_constrains(double scalar=1.) override
unsigned int uint
unsigned int size() const
Returns number of keys in the Record.
Definition: type_record.hh:598
Solver based on the original PETSc solver using MPIAIJ matrix and succesive Schur complement construc...
virtual void set_from_input(const Input::Record in_rec)
Definition: linsys.hh:602
bool matrix_changed_
true if the matrix was changed since the last solve
Definition: linsys.hh:642
double * v_rhs_
local RHS array pointing to Vec rhs_
Class Input::Type::Default specifies default value of keys of a Input::Type::Record.
Definition: type_record.hh:61
void set_from_input(const Input::Record in_rec) override
LinSys::SolveInfo solve() override
bool symmetric_
Definition: linsys.hh:637
ConstraintVec_ constraints_
Definition: linsys.hh:651
Vec rhs_
PETSc vector constructed with vx array.
void chkerr(unsigned int ierr)
Replacement of new/delete operator in the spirit of xmalloc.
Definition: system.hh:147
#define ADD_CALLS(n_calls)
Increase number of calls in actual timer.
void start_allocation() override
Class for declaration of the integral input data.
Definition: type_base.hh:490
void preallocate_values(int nrow, int *rows, int ncol, int *cols)
Input::Record in_rec_
Definition: linsys.hh:655
void start_add_assembly() override
#define LogOut()
Macro defining &#39;log&#39; record of log.
Definition: logger.hh:249
bool rhs_changed_
true if the right hand side was changed since the last solve
Definition: linsys.hh:643
Record & close() const
Close the Record for further declarations of keys.
Definition: type_record.cc:303
double get_solution_precision() override
void start_insert_assembly() override
virtual Record & derive_from(Abstract &parent)
Method to derive new Record from an AbstractRecord parent.
Definition: type_record.cc:195
#define OLD_ASSERT(...)
Definition: global_defs.h:131
Class for declaration of the input data that are floating point numbers.
Definition: type_base.hh:541
MPI_Comm comm_
Definition: linsys.hh:629
unsigned int max_it_
maximum number of iterations of linear solver
Definition: linsys.hh:627
T * makePetscPointer_(std::vector< T > &array)
LinSys_PETSC(const Distribution *rows_ds, const std::string &params="")
Definition: linsys_PETSC.cc:57
Accessor to the data with type Type::Record.
Definition: accessors.hh:292
const Ret val(const string &key) const
#define START_TIMER(tag)
Starts a timer with specified tag.
const Distribution * rows_ds_
final distribution of rows of MH matrix
Definition: linsys.hh:635
double a_tol_
absolute tolerance of linear solver
Definition: linsys.hh:626
Record & declare_key(const string &key, std::shared_ptr< TypeBase > type, const Default &default_value, const string &description, TypeBase::attribute_map key_attributes=TypeBase::attribute_map())
Declares a new key of the Record.
Definition: type_record.cc:501
bool is_empty() const
Definition: accessors.hh:366
unsigned int np() const
get num of processors
double residual_norm_
local solution array pointing into Vec solution_
Definition: linsys.hh:649
Vec on_vec_
Vectors for counting non-zero entries in diagonal block.
void preallocate_matrix()
double compute_residual() override
std::string params_
command-line-like options for the PETSc solver
static Default read_time(const std::string &description)
The factory function to make an default value that will be specified at the time when a key will be r...
Definition: type_record.hh:97
KSPConvergedReason reason
Vec off_vec_
Vectors for counting non-zero entries in off-diagonal block.
double r_tol_
relative tolerance of linear solver
Definition: linsys.hh:625
void finish_assembly() override
void view() override
void rhs_set_values(int nrow, int *rows, double *vals) override
bool is_positive_definite()
Definition: linsys.hh:558
#define WarningOut()
Macro defining &#39;warning&#39; record of log.
Definition: logger.hh:246
void set_initial_guess_nonzero(bool set_nonzero=true)
static const Input::Type::Record & get_input_type()
Definition: linsys_PETSC.cc:32
void set_tolerances(double r_tol, double a_tol, unsigned int max_it) override
Definition: linsys_PETSC.cc:86
Mat matrix_
Petsc matrix of the problem.
static const int registrar
Registrar of class to factory.
Record type proxy class.
Definition: type_record.hh:182
void mat_set_values(int nrow, int *rows, int ncol, int *cols, double *vals) override
static Input::Type::Abstract & get_input_type()
Definition: linsys.cc:29
bool init_guess_nonzero
flag for starting from nonzero guess
#define DebugOut()
Macro defining &#39;debug&#39; record of log.
Definition: logger.hh:252
Class for declaration of the input data that are in string format.
Definition: type_base.hh:589
Vec solution_
PETSc vector constructed with vb array.
Definition: linsys.hh:645
double solution_precision_
unsigned int lsize(int proc) const
get local size