doxygen/src/cs__sles__it__priv_8h_source.html

 #ifndef __CS_SLES_IT_PRIV_H__
 #define __CS_SLES_IT_PRIV_H__

 /*============================================================================
  * Sparse Linear Equation Solvers: private elements.
  *
  * These elements are shared between iterative solvers and smoother
  * both for host and device implementations, but are not accessible to
  * calling code.
  *============================================================================*/

 /*
   This file is part of code_saturne, a general-purpose CFD tool.

   Copyright (C) 1998-2022 EDF S.A.

   This program is free software; you can redistribute it and/or modify it under
   the terms of the GNU General Public License as published by the Free Software
   Foundation; either version 2 of the License, or (at your option) any later
   version.

   This program is distributed in the hope that it will be useful, but WITHOUT
   ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
   FOR A PARTICULAR PURPOSE.  See the GNU General Public License for more
   details.

   You should have received a copy of the GNU General Public License along with
   this program; if not, write to the Free Software Foundation, Inc., 51 Franklin
   Street, Fifth Floor, Boston, MA 02110-1301, USA.
 */

 /*----------------------------------------------------------------------------*/

 #include "cs_defs.h"

 /*----------------------------------------------------------------------------
  * Standard C library headers
  *----------------------------------------------------------------------------*/

 #include <stdarg.h>
 #include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
 #include <assert.h>
 #include <math.h>

 #if defined(HAVE_MPI)
 #include <mpi.h>
 #endif

 /*----------------------------------------------------------------------------
  * Local headers
  *----------------------------------------------------------------------------*/

 #include "bft_mem.h"
 #include "bft_error.h"
 #include "bft_printf.h"

 #include "cs_base.h"
 #include "cs_blas.h"
 #include "cs_file.h"
 #include "cs_log.h"
 #include "cs_halo.h"
 #include "cs_mesh.h"
 #include "cs_matrix.h"
 #include "cs_matrix_default.h"
 #include "cs_matrix_util.h"
 #include "cs_post.h"
 #include "cs_timer.h"
 #include "cs_time_plot.h"

 /*----------------------------------------------------------------------------
  *  Header for the current file
  *----------------------------------------------------------------------------*/

 #include "cs_sles.h"
 #include "cs_sles_it.h"
 #include "cs_sles_pc.h"

 /*----------------------------------------------------------------------------*/

 BEGIN_C_DECLS

 /*=============================================================================
  * Local Macro Definitions
  *============================================================================*/

 /* Fallback definition, used only when HUGE_VAL is not already defined
    (it is normally provided by <math.h>, included above) */

 #if !defined(HUGE_VAL)
 #define HUGE_VAL  1.E+12
 #endif

 /* Upper bound on the db_size argument of _fw_and_bw_lu and
    _fw_and_bw_lu_gs (checked there by assertion); also the size of the
    local work array in _fw_and_bw_lu */

 #define DB_SIZE_MAX 9

 /*=============================================================================
  * Local Structure Definitions
  *============================================================================*/

 /*----------------------------------------------------------------------------
  * Function pointer for actual resolution of a linear system.
  *
  * parameters:
  *   c               <-- pointer to solver context info
  *   a               <-- linear equation matrix
  *   diag_block_size <-- diagonal block size
  *   convergence     <-- convergence information structure
  *   rhs             <-- right hand side
  *   vx              --> system solution
  *   aux_size        <-- size of aux_vectors (in bytes)
  *   aux_vectors     --- optional working area (allocation otherwise)
  *
  * returns:
  *   convergence status
  *----------------------------------------------------------------------------*/

 typedef cs_sles_convergence_state_t
 (cs_sles_it_solve_t) (cs_sles_it_t              *c,
                       const cs_matrix_t         *a,
                       cs_lnum_t                  diag_block_size,
                       cs_sles_it_convergence_t  *convergence,
                       const cs_real_t           *rhs,
                       cs_real_t                 *restrict vx,
                       size_t                     aux_size,
                       void                      *aux_vectors);

 /* Solver setup data */
 /*-------------------*/

 /* Referenced through the setup_data member of cs_sles_it_t.
    The n_rows member is the vector length passed to the cs_dot* calls
    by the dot product helpers of this file. */

 typedef struct _cs_sles_it_setup_t {

   double               initial_residue;  /* last initial residue value */

   cs_lnum_t            n_rows;           /* number of associated rows */

   const cs_real_t     *ad_inv;           /* pointer to diagonal inverse */
   cs_real_t           *_ad_inv;          /* private pointer to
                                             diagonal inverse
                                             (presumably set only when the
                                             array is owned by this
                                             structure; TODO confirm) */

   void                *pc_context;       /* preconditioner context */
   cs_sles_pc_apply_t  *pc_apply;         /* preconditioner apply function */

 } cs_sles_it_setup_t;

 /* Solver additional data */
 /*------------------------*/

 /* Referenced through the add_data member of cs_sles_it_t. */

 typedef struct _cs_sles_it_add_t {

   cs_lnum_t           *order;            /* ordering (array of local ids;
                                             its use is not visible in this
                                             header) */

 } cs_sles_it_add_t;

 /* Basic per linear system options and logging */
 /*---------------------------------------------*/

 struct _cs_sles_it_t {

   /* Base settings */

   cs_sles_it_type_t    type;               /* Solver type */

   bool                 on_device;          /* Sparse matrix-vector product
                                               (SpMV) on device ? */

   bool                 update_stats;       /* do stats need to be updated ? */
   bool                 ignore_convergence; /* ignore convergence for some
                                               solvers used as preconditioners */

   int                  n_max_iter;         /* maximum number of iterations */
   int                  restart_interval;   /* maximum number of iterations
                                               before restarting the algorithm
                                               (only applicable for GMRES or GCR
                                               algorithm up to now) */

   cs_sles_it_solve_t  *solve;              /* pointer to solve function */

   cs_sles_pc_t        *pc;                 /* pointer to possibly shared
                                               preconditioner object */
   cs_sles_pc_t        *_pc;                /* pointer to owned
                                               preconditioner object */

   /* Performance data */

   unsigned             n_setups;           /* Number of times system setup */
   unsigned             n_solves;           /* Number of times system solved */

   unsigned             n_iterations_last;  /* Number of iterations for last
                                               system resolution */
   unsigned             n_iterations_min;   /* Minimum number of iterations
                                               in system resolution history */
   unsigned             n_iterations_max;   /* Maximum number of iterations
                                               in system resolution history */
   unsigned long long   n_iterations_tot;   /* Total accumulated number of
                                               iterations */

   cs_timer_counter_t   t_setup;            /* Total setup time */
   cs_timer_counter_t   t_solve;            /* Total solve time */

   /* Plot info */

   int                  plot_time_stamp;    /* Plot time stamp */
   cs_time_plot_t      *plot;               /* Pointer to plot structure,
                                               which may be owned or shared */
   cs_time_plot_t      *_plot;              /* Pointer to own plot structure */

   /* Communicator used for reduction operations
      (if left at NULL, main communicator will be used).
      Note that the dot product helpers of this file only call
      MPI_Allreduce when comm differs from MPI_COMM_NULL. */

 # if defined(HAVE_MPI)
   MPI_Comm comm;            /* communicator used by the reductions */
   MPI_Comm caller_comm;     /* presumably the calling code's communicator;
                                TODO confirm */
   int      caller_n_ranks;  /* presumably the number of ranks in
                                caller_comm; TODO confirm */
 # endif

   /* Solver setup */

   const struct _cs_sles_it_t  *shared;     /* pointer to context sharing some
                                               setup and preconditioner data,
                                               or NULL */

   cs_sles_it_add_t            *add_data;   /* additional data */

   cs_sles_it_setup_t          *setup_data; /* setup data */

   /* Alternative solvers (fallback or heuristics) */

   cs_sles_convergence_state_t  fallback_cvg;  /* threshold for fallback
                                                  convergence */
   cs_sles_it_t                *fallback;   /* fallback solver */

 };

 /* Convergence testing and tracking */
 /*----------------------------------*/

 /* Structure passed to solve functions of type cs_sles_it_solve_t
    (see the "convergence" argument of that typedef). */

 struct _cs_sles_it_convergence_t {

   const char          *name;               /* Pointer to name string */

   int                  verbosity;          /* Verbosity level */

   unsigned             n_iterations;       /* Current number of iterations */
   unsigned             n_iterations_max;   /* Maximum number of iterations */

   double               precision;          /* Precision limit */
   double               r_norm;             /* Residue normalization */
   double               residue;            /* Current residue */

 };

 /*============================================================================
  * Inline static function definitions
  *============================================================================*/

 /*----------------------------------------------------------------------------
  * Dot product of two vectors, reduced over the solver's communicator.
  *
  * The local value is computed by cs_dot over c->setup_data->n_rows entries.
  * When built with MPI and c->comm is not MPI_COMM_NULL, local values are
  * summed over c->comm; otherwise the local value is returned directly.
  *
  * parameters:
  *   c      <-- pointer to solver context info
  *   x      <-- first vector
  *   y      <-- second vector
  *
  * returns:
  *   x.y
  *----------------------------------------------------------------------------*/

 inline static double
 _dot_product(const cs_sles_it_t  *c,
              const cs_real_t     *x,
              const cs_real_t     *y)
 {
   double dot_loc = cs_dot(c->setup_data->n_rows, x, y);

 #if defined(HAVE_MPI)

   /* Nothing to reduce without a valid communicator */
   if (c->comm == MPI_COMM_NULL)
     return dot_loc;

   double dot_glob;
   MPI_Allreduce(&dot_loc, &dot_glob, 1, MPI_DOUBLE, MPI_SUM, c->comm);

   return dot_glob;

 #else

   return dot_loc;

 #endif /* defined(HAVE_MPI) */
 }

 /*----------------------------------------------------------------------------
  * Dot product of a vector with itself, reduced over the solver's
  * communicator.
  *
  * The local value is computed by cs_dot_xx over c->setup_data->n_rows
  * entries. When built with MPI and c->comm is not MPI_COMM_NULL, local
  * values are summed over c->comm.
  *
  * parameters:
  *   c      <-- pointer to solver context info
  *   x      <-- vector
  *
  * returns:
  *   x.x
  *----------------------------------------------------------------------------*/

 inline static double
 _dot_product_xx(const cs_sles_it_t  *c,
                 const cs_real_t     *x)
 {
   double xx_loc = cs_dot_xx(c->setup_data->n_rows, x);

 #if defined(HAVE_MPI)

   /* Nothing to reduce without a valid communicator */
   if (c->comm == MPI_COMM_NULL)
     return xx_loc;

   double xx_glob;
   MPI_Allreduce(&xx_loc, &xx_glob, 1, MPI_DOUBLE, MPI_SUM, c->comm);

   return xx_glob;

 #else

   return xx_loc;

 #endif /* defined(HAVE_MPI) */
 }

 /*----------------------------------------------------------------------------
  * Two dot products, x.x and x.y, reduced together over the solver's
  * communicator.
  *
  * Local values are computed by a single cs_dot_xx_xy call over
  * c->setup_data->n_rows entries. When built with MPI and c->comm is not
  * MPI_COMM_NULL, both values are summed over c->comm in one MPI_Allreduce.
  *
  * parameters:
  *   c      <-- pointer to solver context info
  *   x      <-- vector used in both products
  *   y      <-- vector used in x.y
  *   s1     --> x.x
  *   s2     --> x.y
  *----------------------------------------------------------------------------*/

 inline static void
 _dot_products_xx_xy(const cs_sles_it_t  *c,
                     const cs_real_t     *x,
                     const cs_real_t     *y,
                     double              *s1,
                     double              *s2)
 {
   double loc[2];
   const double *res = loc;  /* points to whichever buffer holds the result */

   cs_dot_xx_xy(c->setup_data->n_rows, x, y, &loc[0], &loc[1]);

 #if defined(HAVE_MPI)

   double glob[2];

   if (c->comm != MPI_COMM_NULL) {
     MPI_Allreduce(loc, glob, 2, MPI_DOUBLE, MPI_SUM, c->comm);
     res = glob;
   }

 #endif /* defined(HAVE_MPI) */

   *s1 = res[0];
   *s2 = res[1];
 }

 /*----------------------------------------------------------------------------
  * Two dot products, x.y and y.z, reduced together over the solver's
  * communicator.
  *
  * Local values are computed by a single cs_dot_xy_yz call over
  * c->setup_data->n_rows entries. When built with MPI and c->comm is not
  * MPI_COMM_NULL, both values are summed over c->comm in one MPI_Allreduce.
  *
  * parameters:
  *   c      <-- pointer to solver context info
  *   x      <-- vector used in x.y
  *   y      <-- vector used in both products
  *   z      <-- vector used in y.z
  *   s1     --> x.y
  *   s2     --> y.z
  *----------------------------------------------------------------------------*/

 inline static void
 _dot_products_xy_yz(const cs_sles_it_t  *c,
                     const cs_real_t     *x,
                     const cs_real_t     *y,
                     const cs_real_t     *z,
                     double              *s1,
                     double              *s2)
 {
   double loc[2];
   const double *res = loc;  /* points to whichever buffer holds the result */

   cs_dot_xy_yz(c->setup_data->n_rows, x, y, z, &loc[0], &loc[1]);

 #if defined(HAVE_MPI)

   double glob[2];

   if (c->comm != MPI_COMM_NULL) {
     MPI_Allreduce(loc, glob, 2, MPI_DOUBLE, MPI_SUM, c->comm);
     res = glob;
   }

 #endif /* defined(HAVE_MPI) */

   *s1 = res[0];
   *s2 = res[1];
 }

 /*----------------------------------------------------------------------------
  * Three dot products, x.x, x.y and y.z, reduced together over the solver's
  * communicator.
  *
  * Local values are computed by a single cs_dot_xx_xy_yz call over
  * c->setup_data->n_rows entries. When built with MPI and c->comm is not
  * MPI_COMM_NULL, the three values are summed over c->comm in one
  * MPI_Allreduce.
  *
  * parameters:
  *   c      <-- pointer to solver context info
  *   x      <-- first vector
  *   y      <-- second vector
  *   z      <-- third vector
  *   s1     --> x.x
  *   s2     --> x.y
  *   s3     --> y.z
  *----------------------------------------------------------------------------*/

 inline static void
 _dot_products_xx_xy_yz(const cs_sles_it_t  *c,
                        const cs_real_t     *x,
                        const cs_real_t     *y,
                        const cs_real_t     *z,
                        double              *s1,
                        double              *s2,
                        double              *s3)
 {
   double loc[3];
   const double *res = loc;  /* points to whichever buffer holds the result */

   cs_dot_xx_xy_yz(c->setup_data->n_rows, x, y, z,
                   &loc[0], &loc[1], &loc[2]);

 #if defined(HAVE_MPI)

   double glob[3];

   if (c->comm != MPI_COMM_NULL) {
     MPI_Allreduce(loc, glob, 3, MPI_DOUBLE, MPI_SUM, c->comm);
     res = glob;
   }

 #endif /* defined(HAVE_MPI) */

   *s1 = res[0];
   *s2 = res[1];
   *s3 = res[2];
 }

 /*----------------------------------------------------------------------------
  * Five dot products of three vectors, reduced together over the solver's
  * communicator.
  *
  * Local values are computed by a single cs_dot_xx_yy_xy_xz_yz call over
  * c->setup_data->n_rows entries. When built with MPI and c->comm is not
  * MPI_COMM_NULL, the five values are summed over c->comm in one
  * MPI_Allreduce.
  *
  * parameters:
  *   c      <-- pointer to solver context info
  *   x      <-- first vector
  *   y      <-- second vector
  *   z      <-- third vector
  *   xx     --> x.x
  *   yy     --> y.y
  *   xy     --> x.y
  *   xz     --> x.z
  *   yz     --> y.z
  *----------------------------------------------------------------------------*/

 inline static void
 _dot_products_xx_yy_xy_xz_yz(const cs_sles_it_t  *c,
                              const cs_real_t     *x,
                              const cs_real_t     *y,
                              const cs_real_t     *z,
                              double              *xx,
                              double              *yy,
                              double              *xy,
                              double              *xz,
                              double              *yz)
 {
   /* Result slots, in order: x.x, y.y, x.y, x.z, y.z */
   double dots[5];

   cs_dot_xx_yy_xy_xz_yz(c->setup_data->n_rows, x, y, z,
                         &dots[0], &dots[1], &dots[2], &dots[3], &dots[4]);

 #if defined(HAVE_MPI)

   if (c->comm != MPI_COMM_NULL) {
     double dots_g[5];
     MPI_Allreduce(dots, dots_g, 5, MPI_DOUBLE, MPI_SUM, c->comm);
     for (int i = 0; i < 5; i++)
       dots[i] = dots_g[i];
   }

 #endif /* defined(HAVE_MPI) */

   *xx = dots[0];
   *yy = dots[1];
   *xy = dots[2];
   *xz = dots[3];
   *yz = dots[4];
 }

 /*----------------------------------------------------------------------------
  * Four dot products, v.r, v.w, v.q and r.r, reduced together over the
  * solver's communicator.
  *
  * Local values are obtained from two calls (cs_dot_xy_yz and cs_dot_xx_xy)
  * over c->setup_data->n_rows entries, as no single 4-product call is used
  * here. When built with MPI and c->comm is not MPI_COMM_NULL, the four
  * values are summed over c->comm in one MPI_Allreduce.
  *
  * parameters:
  *   c      <-- pointer to solver context info
  *   v      <-- first vector
  *   r      <-- second vector
  *   w      <-- third vector
  *   q      <-- fourth vector
  *   s1     --> v.r
  *   s2     --> v.w
  *   s3     --> v.q
  *   s4     --> r.r
  *----------------------------------------------------------------------------*/

 inline static void
 _dot_products_vr_vw_vq_rr(const cs_sles_it_t  *c,
                           const cs_real_t     *v,
                           const cs_real_t     *r,
                           const cs_real_t     *w,
                           const cs_real_t     *q,
                           double              *s1,
                           double              *s2,
                           double              *s3,
                           double              *s4)
 {
   /* Result slots, in order: v.r, v.w, v.q, r.r */
   double dots[4];

   /* (w, v, q) yields w.v and v.q; (r, v) yields r.r and r.v */

   cs_dot_xy_yz(c->setup_data->n_rows, w, v, q, &dots[1], &dots[2]);
   cs_dot_xx_xy(c->setup_data->n_rows, r, v, &dots[3], &dots[0]);

 #if defined(HAVE_MPI)

   if (c->comm != MPI_COMM_NULL) {
     double dots_g[4];
     MPI_Allreduce(dots, dots_g, 4, MPI_DOUBLE, MPI_SUM, c->comm);
     for (int i = 0; i < 4; i++)
       dots[i] = dots_g[i];
   }

 #endif /* defined(HAVE_MPI) */

   *s1 = dots[0];
   *s2 = dots[1];
   *s3 = dots[2];
   *s4 = dots[3];
 }

 /*----------------------------------------------------------------------------
  * Block Jacobi utilities.
  * Forward and backward substitution for a 3*3 system in LU form,
  * with right hand side (c - b).
  *
  * mat is read as a row-major 3*3 block: entries below the diagonal are
  * used as the L factor (with an implied unit diagonal), entries on and
  * above the diagonal as the U factor.
  *
  * parameters:
  *   mat   <-- 3*3 LU-factorized block
  *   x     --> solution
  *   b     <-- 1st part of RHS (c - b)
  *   c     <-- 2nd part of RHS (c - b)
  *----------------------------------------------------------------------------*/

 inline static void
 _fw_and_bw_lu33(const cs_real_t  mat[],
                 cs_real_t        x[restrict],
                 const cs_real_t  b[restrict],
                 const cs_real_t  c[restrict])
 {
   /* Forward substitution (unit lower triangular part) */
   const cs_real_t y0 = (c[0] - b[0]);
   const cs_real_t y1 = (c[1] - b[1]) - y0*mat[3];
   const cs_real_t y2 = (c[2] - b[2]) - y0*mat[6] - y1*mat[7];

   /* Backward substitution (upper triangular part), last row first */
   x[2] = y2/mat[8];
   x[1] = (y1 - mat[5]*x[2])/mat[4];
   x[0] = (y0 - mat[1]*x[1] - mat[2]*x[2])/mat[0];
 }

 /*----------------------------------------------------------------------------
  * Block Jacobi utilities.
  * Forward and backward substitution for a P*P system in LU form,
  * with right hand side (c - b).
  *
  * mat is read as a row-major db_size*db_size block: entries below the
  * diagonal are used as the L factor (with an implied unit diagonal),
  * entries on and above the diagonal as the U factor.
  *
  * db_size must not exceed DB_SIZE_MAX (checked by assertion only), as the
  * intermediate vector is held in a fixed-size local array.
  *
  * parameters:
  *   mat     <-- P*P LU-factorized block
  *   db_size <-- block size (P)
  *   x       --> solution
  *   b       <-- 1st part of RHS (c - b)
  *   c       <-- 2nd part of RHS (c - b)
  *----------------------------------------------------------------------------*/

 inline static void
 _fw_and_bw_lu(const cs_real_t  mat[],
               int              db_size,
               cs_real_t        x[restrict],
               const cs_real_t  b[restrict],
               const cs_real_t  c[restrict])
 {
   assert(db_size <= DB_SIZE_MAX);
   cs_real_t fwd[DB_SIZE_MAX];

   /* Forward substitution: fwd = L^-1 (c - b) */
   for (int i = 0; i < db_size; i++) {
     const cs_real_t *row = mat + i*db_size;
     cs_real_t acc = (c[i] - b[i]);
     for (int j = 0; j < i; j++)
       acc -= fwd[j]*row[j];
     fwd[i] = acc;
   }

   /* Backward substitution: x = U^-1 fwd, last row first */
   for (int i = db_size; i-- > 0; ) {
     const cs_real_t *row = mat + i*db_size;
     cs_real_t acc = fwd[i];
     for (int j = db_size - 1; j > i; j--)
       acc -= x[j]*row[j];
     x[i] = acc/row[i];
   }
 }

 /*----------------------------------------------------------------------------
  * Block Gauss-Seidel utilities.
  * Forward and backward substitution for a P*P system in LU form.
  *
  * mat is read as a row-major db_size*db_size block: entries below the
  * diagonal are used as the L factor (with an implied unit diagonal),
  * entries on and above the diagonal as the U factor. The solution array
  * x also holds the intermediate (forward) result; b is only read.
  *
  * parameters:
  *   mat     <-- P*P LU-factorized block
  *   db_size <-- block size (P); asserted not to exceed DB_SIZE_MAX
  *   x       --> solution
  *   b       <-- RHS
  *----------------------------------------------------------------------------*/

 inline static void
 _fw_and_bw_lu_gs(const cs_real_t  mat[],
                  int              db_size,
                  cs_real_t        x[restrict],
                  const cs_real_t  b[restrict])
 {
   assert(db_size <= DB_SIZE_MAX);

   /* Forward substitution: x = L^-1 b */
   for (int i = 0; i < db_size; i++) {
     const cs_real_t *row = mat + i*db_size;
     cs_real_t acc = b[i];
     for (int j = 0; j < i; j++)
       acc -= x[j]*row[j];
     x[i] = acc;
   }

   /* Backward substitution in place: x = U^-1 x, last row first */
   for (int i = db_size; i-- > 0; ) {
     const cs_real_t *row = mat + i*db_size;
     cs_real_t acc = x[i];
     for (int j = db_size - 1; j > i; j--)
       acc -= x[j]*row[j];
     x[i] = acc/row[i];
   }
 }

 /*============================================================================
  * Public function definitions
  *============================================================================*/

 /*----------------------------------------------------------------------------
  * Initialize a convergence info structure.
  *
  * Only the prototype is visible in this header. The correspondence between
  * arguments and cs_sles_it_convergence_t members noted below is assumed
  * from matching names and should be confirmed against the definition.
  *
  * parameters:
  *   convergence <-> pointer to convergence info structure
  *   solver_name <-- pointer to solver name (presumably the "name" member)
  *   verbosity   <-- verbosity level
  *   n_iter_max  <-- maximum number of iterations
  *   precision   <-- precision limit
  *   r_norm      <-- residue normalization
  *   residue     <-> pointer to residue value (whether it is read, written,
  *                   or both is not visible here; TODO confirm)
  *----------------------------------------------------------------------------*/

 void
 cs_sles_it_convergence_init(cs_sles_it_convergence_t  *convergence,
                             const char                *solver_name,
                             int                        verbosity,
                             unsigned                   n_iter_max,
                             double                     precision,
                             double                     r_norm,
                             double                    *residue);

 /*----------------------------------------------------------------------------
  * Setup context for iterative linear solver.
  *
  * This function is common to most solvers. Only its prototype appears in
  * this header.
  *
  * parameters:
  *   c                <-> pointer to solver context info
  *   name             <-- pointer to system name
  *   a                <-- matrix
  *   verbosity        <-- verbosity level
  *   diag_block_size  <-- diagonal block size
  *   block_nn_inverse <-- if diagonal block size is 3 or 6, compute inverse of
  *                        block if true, inverse of block diagonal otherwise
  *----------------------------------------------------------------------------*/

 void
 cs_sles_it_setup_priv(cs_sles_it_t       *c,
                       const char         *name,
                       const cs_matrix_t  *a,
                       int                 verbosity,
                       int                 diag_block_size,
                       bool                block_nn_inverse);

 /*----------------------------------------------------------------------------*/

 END_C_DECLS

 #endif /* __CS_SLES_IT_PRIV_H__ */
cs_log.h

restrict
#define restrict
Definition: cs_defs.h:142

cs_dot_xx_xy_yz
void cs_dot_xx_xy_yz(cs_lnum_t n, const cs_real_t *restrict x, const cs_real_t *restrict y, const cs_real_t *restrict z, double *xx, double *xy, double *yz)
Return 3 dot products of 3 vectors: x.x, x.y, and y.z.
Definition: cs_blas.c:1622

bft_printf.h

cs_blas.h

cs_base.h

cs_dot_xy_yz
void cs_dot_xy_yz(cs_lnum_t n, const cs_real_t *restrict x, const cs_real_t *restrict y, const cs_real_t *restrict z, double *xy, double *yz)
Return 2 dot products of 3 vectors: x.y, and y.z.
Definition: cs_blas.c:1593

cs_file.h

cs_sles_it_type_t
cs_sles_it_type_t
Definition: cs_sles_it.h:55

cs_dot
double cs_dot(cs_lnum_t n, const cs_real_t *x, const cs_real_t *y)
Return the dot product of 2 vectors: x.y.
Definition: cs_blas.c:1465

cs_sles.h

cs_time_plot.h

cs_defs.h

cs_post.h

BEGIN_C_DECLS
#define BEGIN_C_DECLS
Definition: cs_defs.h:510

cs_sles_pc_t
struct _cs_sles_pc_t cs_sles_pc_t
Definition: cs_sles_pc.h:66

cs_sles_pc.h

cs_matrix.h

cs_sles_it_t
struct _cs_sles_it_t cs_sles_it_t
Definition: cs_sles_it.h:86

cs_matrix_default.h

cs_real_t
double cs_real_t
Floating-point value.
Definition: cs_defs.h:322

cs_dot_xx_xy
void cs_dot_xx_xy(cs_lnum_t n, const cs_real_t *restrict x, const cs_real_t *restrict y, double *xx, double *xy)
Return 2 dot products of 2 vectors: x.x, and x.y.
Definition: cs_blas.c:1566

cs_sles_pc_apply_t
cs_sles_pc_state_t() cs_sles_pc_apply_t(void *context, const cs_real_t *x_in, cs_real_t *x_out)
Function pointer for application of a preconditioner.
Definition: cs_sles_pc.h:145

cs_matrix_t
struct _cs_matrix_t cs_matrix_t
Definition: cs_matrix.h:110

cs_time_plot_t
struct _cs_time_plot_t cs_time_plot_t
Definition: cs_time_plot.h:48

cs_timer.h

cs_sles_convergence_state_t
cs_sles_convergence_state_t
Convergence status indicator.
Definition: cs_sles.h:56

atimbr::v
double precision, dimension(:,:,:), allocatable v
Definition: atimbr.f90:114

cs_dot_xx_yy_xy_xz_yz
void cs_dot_xx_yy_xy_xz_yz(cs_lnum_t n, const cs_real_t *restrict x, const cs_real_t *restrict y, const cs_real_t *restrict z, double *xx, double *yy, double *xy, double *xz, double *yz)
Return 5 dot products of 3 vectors: x.x, y.y, x.y, x.z, and y.z.
Definition: cs_blas.c:1654

cs_sles_it_convergence_t
struct _cs_sles_it_convergence_t cs_sles_it_convergence_t
Definition: cs_sles_it.h:90

bft_error.h

cs_fuel_incl::a
double precision, save a
Definition: cs_fuel_incl.f90:146

cs_halo.h

cs_dot_xx
double cs_dot_xx(cs_lnum_t n, const cs_real_t *x)
Return dot products of a vector with itself: x.x.
Definition: cs_blas.c:1486

cs_lnum_t
int cs_lnum_t
local mesh entity id
Definition: cs_defs.h:316

cs_mesh.h

END_C_DECLS
#define END_C_DECLS
Definition: cs_defs.h:511

bft_mem.h

cs_sles_it.h

cs_matrix_util.h

cs_timer_counter_t
Definition: cs_timer.h:55

cs_fuel_incl::b
double precision, save b
Definition: cs_fuel_incl.f90:146