Added doxygen-style comments

2025-02-11 06:25:34 -06:00 · 2019-12-18 17:05:33 +01:00 · 2019-12-18 17:05:33 +01:00 · 57344fd5e0
commit 57344fd5e0
parent 6506ab5f55
5 changed files with 59 additions and 5 deletions
--- a/opm/simulators/linalg/bda/BdaBridge.cpp
+++ b/opm/simulators/linalg/bda/BdaBridge.cpp
@ -35,7 +35,7 @@ typedef Dune::InverseOperatorResult InverseOperatorResult;
 namespace Opm
 {

-BdaBridge::BdaBridge(bool use_gpu_, int linear_solver_verbosity OPM_UNUSED, int maxit OPM_UNUSED, double tolerance OPM_UNUSED) : use_gpu(use_gpu_) {
+BdaBridge::BdaBridge(bool use_gpu_ OPM_UNUSED, int linear_solver_verbosity OPM_UNUSED, int maxit OPM_UNUSED, double tolerance OPM_UNUSED) : use_gpu(use_gpu_) {
 #if HAVE_CUDA
    if (use_gpu) {
        backend.reset(new cusparseSolverBackend(linear_solver_verbosity, maxit, tolerance));
--- a/opm/simulators/linalg/bda/BdaBridge.hpp
+++ b/opm/simulators/linalg/bda/BdaBridge.hpp
@ -35,7 +35,8 @@ namespace Opm

 typedef Dune::InverseOperatorResult InverseOperatorResult;

-
+/// BdaBridge acts as the interface between opm-simulators and the cusparseSolver.
+/// If CUDA was not found during CMake, the function bodies of this class are empty.
 class BdaBridge
 {
 private:
@ -45,11 +46,23 @@ private:
    bool use_gpu;

 public:
+    /// Construct a BdaBridge
+    /// \param[in] use_gpu                    true iff the cusparseSolver is used, is passed via command-line: '--use-gpu=[true|false]'
+    /// \param[in] linear_solver_verbosity    verbosity of cusparseSolver
+    /// \param[in] maxit                      maximum number of iterations for cusparseSolver
+    /// \param[in] tolerance                  required relative tolerance for cusparseSolver
    BdaBridge(bool use_gpu, int linear_solver_verbosity, int maxit, double tolerance);

+
+    /// Solve linear system, A*x = b
+    /// \param[in] mat     matrix A, should be of type Dune::BCRSMatrix
+    /// \param[in] b       vector b, should be of type Dune::BlockVector
+    /// \param[inout] result  summary of solver result
    template <class BridgeMatrix, class BridgeVector>
    void solve_system(BridgeMatrix *mat, BridgeVector &b, InverseOperatorResult &result);

+    /// Get the resulting x vector
+    /// \param[inout] x    vector x, should be of type Dune::BlockVector
    template <class BridgeVector>
    void get_result(BridgeVector &x);

--- a/opm/simulators/linalg/bda/BdaResult.hpp
+++ b/opm/simulators/linalg/bda/BdaResult.hpp
@ -23,7 +23,8 @@
 namespace Opm
 {

-// based on InverseOperatorResult struct from dune/istl/solver.hh
+/// This class is based on InverseOperatorResult struct from dune/istl/solver.hh
+/// It is needed to prevent a compile error in basearray.hh, the nvcc compiler might not support all features in there
 class BdaResult
 {

--- a/opm/simulators/linalg/bda/cuda_header.hpp
+++ b/opm/simulators/linalg/bda/cuda_header.hpp
@ -22,6 +22,11 @@

 #include <iostream>

+/// Runtime error checking of CUDA functions
+/// Usage:
+/// cudaMalloc(...);
+/// cudaCheckLastError("Error could not allocate memory");
+///
 #define cudaCheckLastError(msg)    __cudaCheckError( __FILE__, __LINE__, #msg )

 inline void __cudaCheckError(const char *file, const int line, const char *msg){
--- a/opm/simulators/linalg/bda/cusparseSolverBackend.hpp
+++ b/opm/simulators/linalg/bda/cusparseSolverBackend.hpp
@ -29,6 +29,7 @@
 namespace Opm
 {

+/// This class implements a cusparse-based ilu0-bicgstab solver on GPU
 class cusparseSolverBackend{

 private:
@ -68,24 +69,42 @@ private:

    int verbosity = 0;

-
+    /// Solve linear system using ilu0-bicgstab
+    /// \param[inout] res     summary of solver result
    void gpu_pbicgstab(BdaResult& res);

+    /// Initialize GPU and allocate memory
+    /// \param[in] N           number of rows, divide by dim to get number of blockrows
+    /// \param[in] nnz         number of nonzeroes, divide by dim*dim to get number of blocks
+    /// \param[in] dim         size of block
    void initialize(int N, int nnz, int dim);

+    /// Clean memory
    void finalize();

+    /// Copy linear system to GPU
+    /// \param[in] vals        array of nonzeroes, each block is stored row-wise and contiguous, contains nnz values
+    /// \param[in] rows        array of rowPointers, contains N/dim+1 values
+    /// \param[in] cols        array of columnIndices, contains nnz values
+    /// \param[in] b           input vector, contains N values
    void copy_system_to_gpu(double *vals, int *rows, int *cols, double *b);

-    // don't copy rowpointers and colindices, they stay the same
+    /// Update linear system on GPU, don't copy rowpointers and colindices, they stay the same
+    /// \param[in] vals        array of nonzeroes, each block is stored row-wise and contiguous, contains nnz values
+    /// \param[in] b           input vector, contains N values
    void update_system_on_gpu(double *vals, double *b);

+    /// Reset preconditioner on GPU, ilu0-decomposition is done inplace by cusparse
    void reset_prec_on_gpu();

+    /// Analyse sparsity pattern to extract parallelism
    bool analyse_matrix();

+    /// Perform ilu0-decomposition
    bool create_preconditioner();

+    /// Solve linear system
+    /// \param[inout] res     summary of solver result
    void solve_system(BdaResult &res);

 public:
@ -97,12 +116,28 @@ public:
        CUSPARSE_SOLVER_UNKNOWN_ERROR
    };

+    /// Construct a cusparseSolver
+    /// \param[in] linear_solver_verbosity    verbosity of cusparseSolver
+    /// \param[in] maxit                      maximum number of iterations for cusparseSolver
+    /// \param[in] tolerance                  required relative tolerance for cusparseSolver
    cusparseSolverBackend(int linear_solver_verbosity, int maxit, double tolerance);

+    /// Destroy a cusparseSolver, and free memory
    ~cusparseSolverBackend();

+    /// Solve linear system, A*x = b, matrix A must be in blocked-CSR format
+    /// \param[in] N           number of rows, divide by dim to get number of blockrows
+    /// \param[in] nnz         number of nonzeroes, divide by dim*dim to get number of blocks
+    /// \param[in] dim         size of block
+    /// \param[in] vals        array of nonzeroes, each block is stored row-wise and contiguous, contains nnz values
+    /// \param[in] rows        array of rowPointers, contains N/dim+1 values
+    /// \param[in] cols        array of columnIndices, contains nnz values
+    /// \param[in] b           input vector, contains N values
+    /// \param[inout] res      summary of solver result
    cusparseSolverStatus solve_system(int N, int nnz, int dim, double *vals, int *rows, int *cols, double *b, BdaResult &res);

+    /// Post processing after linear solve, now only copies resulting x vector back
+    /// \param[inout] x        resulting x vector, caller must guarantee that x points to a valid array
    void post_process(double *x);

 }; // end class cusparseSolverBackend