doxygen/src/cs__blas_8h_source.html

#ifndef __CS_BLAS_H__

#define __CS_BLAS_H__


/*============================================================================

 * BLAS (Basic Linear Algebra Subroutine) functions

 *============================================================================*/


/*

  This file is part of code_saturne, a general-purpose CFD tool.


  Copyright (C) 1998-2024 EDF S.A.


  This program is free software; you can redistribute it and/or modify it under

  the terms of the GNU General Public License as published by the Free Software

  Foundation; either version 2 of the License, or (at your option) any later

  version.


  This program is distributed in the hope that it will be useful, but WITHOUT

  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS

  FOR A PARTICULAR PURPOSE.  See the GNU General Public License for more

  details.


  You should have received a copy of the GNU General Public License along with

  this program; if not, write to the Free Software Foundation, Inc., 51 Franklin

  Street, Fifth Floor, Boston, MA 02110-1301, USA.

*/


/*----------------------------------------------------------------------------*/


#include "cs_defs.h"


/*----------------------------------------------------------------------------

 * External library headers

 *----------------------------------------------------------------------------*/


/*----------------------------------------------------------------------------

 *  Local headers

 *----------------------------------------------------------------------------*/


#include "cs_base.h"

#include "cs_log.h"


/*----------------------------------------------------------------------------*/


BEGIN_C_DECLS


/*============================================================================

 * Macro definitions

 *============================================================================*/


/*============================================================================

 * Type definitions

 *============================================================================*/


/* BLAS reduction algorithm families, selectable through
   cs_blas_set_reduce_algorithm(). */


typedef enum {


  CS_BLAS_REDUCE_SUPERBLOCK,  /* superblock-based reduction */

  CS_BLAS_REDUCE_KAHAN        /* Kahan summation-based reduction
                                 (NOTE(review): meaning inferred from the
                                 name; confirm against the implementation) */


} cs_blas_reduce_t;


/*============================================================================

 *  Public function prototypes

 *============================================================================*/


/*----------------------------------------------------------------------------*/

/*

 * \brief Print information on BLAS libraries used.

 *

 * \param[in]  log_type  log type (a cs_log_t value, declared in cs_log.h)

 */

/*----------------------------------------------------------------------------*/


void

cs_blas_library_info(cs_log_t  log_type);


/*----------------------------------------------------------------------------*/

/*

 * \brief Set the preferred BLAS reduction algorithm family.

 *

 * This may not be enforced for all algorithms, though it should at least

 * be enforced for the most general functions such as \ref cs_dot.

 *

 * \param[in]  mode   reduction algorithm family to use

 *                    (see \ref cs_blas_reduce_t)

 */

/*----------------------------------------------------------------------------*/


void

cs_blas_set_reduce_algorithm(cs_blas_reduce_t  mode);


/*----------------------------------------------------------------------------

 * Constant times a vector plus a vector: y <-- ax + y

 *

 * The array y is both read and overwritten with the result.

 *

 * parameters:

 *   n <-- size of arrays x and y

 *   a <-- multiplier for x

 *   x <-- array of floating-point values

 *   y <-> array of floating-point values, updated in place

 *----------------------------------------------------------------------------*/


void

cs_axpy(cs_lnum_t         n,

        double            a,

        const cs_real_t  *x,

        cs_real_t        *y);


/*----------------------------------------------------------------------------

 * Return the sum of the values of a vector. For better precision, a

 * superblock algorithm is used.

 *

 * parameters:

 *   n <-- size of array x

 *   x <-- array of floating-point values

 *

 * returns:

 *   the resulting sum

 *----------------------------------------------------------------------------*/


double

cs_sum(cs_lnum_t         n,

       const cs_real_t  *x);


/*----------------------------------------------------------------------------

 * Return the weighted sum of a vector. For better precision, a superblock

 * algorithm is used.

 *

 * \param[in]  n  size of arrays w and x

 * \param[in]  w  array of floating-point weights

 * \param[in]  x  array of floating-point values

 *

 * \return the resulting weighted sum

 *----------------------------------------------------------------------------*/


double

cs_weighted_sum(cs_lnum_t         n,

                const cs_real_t  *w,

                const cs_real_t  *x);


/*----------------------------------------------------------------------------

 * Return the dot product of 2 vectors: x.y

 *

 * parameters:

 *   n <-- size of arrays x and y

 *   x <-- array of floating-point values

 *   y <-- array of floating-point values

 *

 * returns:

 *   the x.y dot product

 *----------------------------------------------------------------------------*/


double

cs_dot(cs_lnum_t         n,

       const cs_real_t  *x,

       const cs_real_t  *y);


/*----------------------------------------------------------------------------

 * Return the dot product of a vector with itself: x.x

 *

 * parameters:

 *   n  <-- size of array x

 *   x  <-- array of floating-point values

 *

 * returns:

 *   the x.x dot product

 *----------------------------------------------------------------------------*/


double

cs_dot_xx(cs_lnum_t         n,

          const cs_real_t  *x);


/*----------------------------------------------------------------------------

 * Return the weighted dot product of a vector with itself: x.x, weighted

 * by w

 *

 * NOTE(review): presumably sum(w.x.x); the exact formula is not visible in

 * this header, confirm against the implementation.

 *

 * For better precision, a superblock algorithm is used.

 *

 * parameters:

 *   n  <-- size of arrays w and x

 *   w  <-- array of weights

 *   x  <-- array of floating-point values

 *

 * returns:

 *   the weighted dot product

 *----------------------------------------------------------------------------*/


double

cs_dot_wxx(cs_lnum_t         n,

           const cs_real_t  *w,

           const cs_real_t  *x);


/*----------------------------------------------------------------------------

 * Return 2 dot products of 2 vectors: x.x, and x.y

 *

 * The products could be computed separately, but computing them

 * simultaneously adds more optimization opportunities and possibly better

 * cache behavior.

 *

 * The results are returned through the xx and xy pointers.

 *

 * parameters:

 *   n  <-- size of arrays x and y

 *   x  <-- array of floating-point values

 *   y  <-- array of floating-point values

 *   xx --> x.x dot product

 *   xy --> x.y dot product

 *----------------------------------------------------------------------------*/


void

cs_dot_xx_xy(cs_lnum_t         n,

             const cs_real_t  *x,

             const cs_real_t  *y,

             double           *xx,

             double           *xy);


/*----------------------------------------------------------------------------

 * Return 2 dot products of 3 vectors: x.y, and y.z

 *

 * The products could be computed separately, but computing them

 * simultaneously adds more optimization opportunities and possibly better

 * cache behavior.

 *

 * The results are returned through the xy and yz pointers.

 *

 * parameters:

 *   n  <-- size of arrays x, y, and z

 *   x  <-- array of floating-point values

 *   y  <-- array of floating-point values

 *   z  <-- array of floating-point values

 *   xy --> x.y dot product

 *   yz --> y.z dot product

 *----------------------------------------------------------------------------*/


void

cs_dot_xy_yz(cs_lnum_t         n,

             const cs_real_t  *x,

             const cs_real_t  *y,

             const cs_real_t  *z,

             double           *xy,

             double           *yz);


/*----------------------------------------------------------------------------

 * Return 3 dot products of 3 vectors: x.x, x.y, and y.z

 *

 * The products could be computed separately, but computing them

 * simultaneously adds more optimization opportunities and possibly better

 * cache behavior.

 *

 * The results are returned through the xx, xy, and yz pointers.

 *

 * parameters:

 *   n  <-- size of arrays x, y, and z

 *   x  <-- array of floating-point values

 *   y  <-- array of floating-point values

 *   z  <-- array of floating-point values

 *   xx --> x.x dot product

 *   xy --> x.y dot product

 *   yz --> y.z dot product

 *----------------------------------------------------------------------------*/


void

cs_dot_xx_xy_yz(cs_lnum_t         n,

                const cs_real_t  *x,

                const cs_real_t  *y,

                const cs_real_t  *z,

                double           *xx,

                double           *xy,

                double           *yz);


/*----------------------------------------------------------------------------

 * Return 5 dot products of 3 vectors: x.x, y.y, x.y, x.z, and y.z

 *

 * The products could be computed separately, but computing them

 * simultaneously adds more optimization opportunities and possibly better

 * cache behavior.

 *

 * The results are returned through the xx, yy, xy, xz, and yz pointers.

 *

 * parameters:

 *   n  <-- size of arrays x, y, and z

 *   x  <-- array of floating-point values

 *   y  <-- array of floating-point values

 *   z  <-- array of floating-point values

 *   xx --> x.x dot product

 *   yy --> y.y dot product

 *   xy --> x.y dot product

 *   xz --> x.z dot product

 *   yz --> y.z dot product

 *----------------------------------------------------------------------------*/


void

cs_dot_xx_yy_xy_xz_yz(cs_lnum_t         n,

                      const cs_real_t  *x,

                      const cs_real_t  *y,

                      const cs_real_t  *z,

                      double           *xx,

                      double           *yy,

                      double           *xy,

                      double           *xz,

                      double           *yz);


/*----------------------------------------------------------------------------

 * Return the global dot product of 2 vectors: x.y

 *

 * In parallel mode, the local results are summed on the default

 * global communicator.

 *

 * parameters:

 *   n <-- size of arrays x and y

 *   x <-- array of floating-point values

 *   y <-- array of floating-point values

 *

 * returns:

 *   the global x.y dot product

 *----------------------------------------------------------------------------*/


double

cs_gdot(cs_lnum_t         n,

        const cs_real_t  *x,

        const cs_real_t  *y);


/*----------------------------------------------------------------------------

 * Return the global dot product of a vector with itself: x.x

 *

 * In parallel mode, the local results are summed on the default

 * global communicator.

 *

 * parameters:

 *   n <-- size of array x

 *   x <-- array of floating-point values

 *

 * returns:

 *   the global x.x dot product

 *----------------------------------------------------------------------------*/


double

cs_gdot_xx(cs_lnum_t n, const cs_real_t *x);


/*----------------------------------------------------------------------------

 * Return 2 global dot products of 2 vectors: x.x, and x.y

 *

 * The products could be computed separately, but computing them

 * simultaneously adds more optimization opportunities and possibly better

 * cache behavior.

 *

 * In parallel mode, the local results are summed on the default

 * global communicator.

 *

 * The results are returned through the xx and xy pointers.

 *

 * parameters:

 *   n  <-- size of arrays x and y

 *   x  <-- array of floating-point values

 *   y  <-- array of floating-point values

 *   xx --> x.x dot product

 *   xy --> x.y dot product

 *----------------------------------------------------------------------------*/


void

cs_gdot_xx_xy(cs_lnum_t        n,

              const cs_real_t *x,

              const cs_real_t *y,

              double          *xx,

              double          *xy);


/*----------------------------------------------------------------------------

 * Return the global residual of 2 intensive vectors:

 *  1/sum(vol) . sum(vol.x.y)

 *

 * parameters:

 *   n   <-- size of arrays vol, x, and y

 *   vol <-- array of floating-point values, used as weights in the

 *           formula above

 *   x   <-- array of floating-point values

 *   y   <-- array of floating-point values

 *

 * returns:

 *   global residual

 *----------------------------------------------------------------------------*/


double

cs_gres(cs_lnum_t         n,

        const cs_real_t  *vol,

        const cs_real_t  *x,

        const cs_real_t  *y);


/*----------------------------------------------------------------------------

 * Return the global volume-weighted mean:

 *  1/sum(vol) . sum(vol.x)

 *

 * parameters:

 *   n   <-- size of arrays vol and x

 *   vol <-- array of floating-point values, used as weights in the

 *           formula above

 *   x   <-- array of floating-point values

 *

 * returns:

 *   global volume-weighted mean

 *----------------------------------------------------------------------------*/


double

cs_gmean(cs_lnum_t         n,

         const cs_real_t  *vol,

         const cs_real_t  *x);


/*----------------------------------------------------------------------------*/


END_C_DECLS


#endif /* __CS_BLAS_H__ */

cs_base.h

cs_gmean
double cs_gmean(cs_lnum_t n, const cs_real_t *vol, const cs_real_t *x)
Return the global spatial average of an intensive vector: 1/sum(vol) . sum(x.vol)
Definition: cs_blas.cpp:1828

cs_dot_wxx
double cs_dot_wxx(cs_lnum_t n, const cs_real_t *w, const cs_real_t *x)
Definition: cs_blas.cpp:1535

cs_axpy
void cs_axpy(cs_lnum_t n, double a, const cs_real_t *x, cs_real_t *y)

cs_dot
double cs_dot(cs_lnum_t n, const cs_real_t *x, const cs_real_t *y)
Return the dot product of 2 vectors: x.y.
Definition: cs_blas.cpp:1495

cs_gdot_xx_xy
void cs_gdot_xx_xy(cs_lnum_t n, const cs_real_t *x, const cs_real_t *y, double *xx, double *xy)
Definition: cs_blas.cpp:1769

cs_gdot_xx
double cs_gdot_xx(cs_lnum_t n, const cs_real_t *x)
Definition: cs_blas.cpp:1741

cs_dot_xy_yz
void cs_dot_xy_yz(cs_lnum_t n, const cs_real_t *x, const cs_real_t *y, const cs_real_t *z, double *xx, double *xy)

cs_weighted_sum
double cs_weighted_sum(cs_lnum_t n, const cs_real_t *w, const cs_real_t *x)
Definition: cs_blas.cpp:1438

cs_dot_xx
double cs_dot_xx(cs_lnum_t n, const cs_real_t *x)
Return dot products of a vector with itself: x.x.
Definition: cs_blas.cpp:1516

cs_dot_xx_xy_yz
void cs_dot_xx_xy_yz(cs_lnum_t n, const cs_real_t *x, const cs_real_t *y, const cs_real_t *z, double *xx, double *xy, double *yz)

cs_blas_reduce_t
cs_blas_reduce_t
Definition: cs_blas.h:57

CS_BLAS_REDUCE_KAHAN
@ CS_BLAS_REDUCE_KAHAN
Definition: cs_blas.h:60

CS_BLAS_REDUCE_SUPERBLOCK
@ CS_BLAS_REDUCE_SUPERBLOCK
Definition: cs_blas.h:59

cs_blas_set_reduce_algorithm
void cs_blas_set_reduce_algorithm(cs_blas_reduce_t mode)
Set the preferred BLAS reduction algorithm family.
Definition: cs_blas.cpp:1312

cs_dot_xx_yy_xy_xz_yz
void cs_dot_xx_yy_xy_xz_yz(cs_lnum_t n, const cs_real_t *x, const cs_real_t *y, const cs_real_t *z, double *xx, double *yy, double *xy, double *xz, double *yz)

cs_gres
double cs_gres(cs_lnum_t n, const cs_real_t *vol, const cs_real_t *x, const cs_real_t *y)
Return the global residual of 2 intensive vectors: 1/sum(vol) . sum(x.y.vol)
Definition: cs_blas.cpp:1803

cs_dot_xx_xy
void cs_dot_xx_xy(cs_lnum_t n, const cs_real_t *x, const cs_real_t *y, double *xx, double *xy)

cs_sum
double cs_sum(cs_lnum_t n, const cs_real_t *x)
Definition: cs_blas.cpp:1384

cs_blas_library_info
void cs_blas_library_info(cs_log_t log_type)
Print information on BLAS libraries used.
Definition: cs_blas.cpp:1284

cs_gdot
double cs_gdot(cs_lnum_t n, const cs_real_t *x, const cs_real_t *y)
Return the global dot product of 2 vectors: x.y.
Definition: cs_blas.cpp:1715

cs_defs.h

BEGIN_C_DECLS
#define BEGIN_C_DECLS
Definition: cs_defs.h:542

cs_real_t
double cs_real_t
Floating-point value.
Definition: cs_defs.h:342

END_C_DECLS
#define END_C_DECLS
Definition: cs_defs.h:543

cs_lnum_t
int cs_lnum_t
local mesh entity id
Definition: cs_defs.h:335

cs_log.h

cs_log_t
cs_log_t
Definition: cs_log.h:48