opm-simulators/opm/simulators/linalg/bda/WellContributions.hpp

/*
  Copyright 2019 Equinor ASA

  This file is part of the Open Porous Media project (OPM).

  OPM is free software: you can redistribute it and/or modify
  it under the terms of the GNU General Public License as published by
  the Free Software Foundation, either version 3 of the License, or
  (at your option) any later version.

  OPM is distributed in the hope that it will be useful,
  but WITHOUT ANY WARRANTY; without even the implied warranty of
  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  GNU General Public License for more details.

  You should have received a copy of the GNU General Public License
  along with OPM.  If not, see <http://www.gnu.org/licenses/>.
*/

#ifndef WellContributions_H
#define WellContributions_H

#include <config.h> // included first: HAVE_CUDA is expected to come from this header, so it must be seen before the #if below

#include <vector>

#if HAVE_CUDA
#include <cuda_runtime.h>
#endif

namespace Opm
{

    /// This class serves to eliminate the need to include the WellContributions into the matrix (with --matrix-add-well-contributions=true) for the cusparseSolver
    /// If the --matrix-add-well-contributions commandline parameter is true, this class should not be used
    ///
    /// The object holds raw buffers that its destructor frees, so it is deliberately non-copyable:
    /// a member-wise copy would leave two objects freeing the same buffers.
    /// Expected call order, as far as the member documentation states it: addSizes() for each well,
    /// then alloc_all(), then addMatrix(), then apply().
    class WellContributions
    {

    private:
        static bool gpu_mode;     // gpu_mode should be initialized in the ISTLSolverEbos constructor, and its value must not change afterwards
        unsigned int num_blocks = 0;    // total number of blocks in all wells
        unsigned int dim = 0;           // NOTE(review): presumably the block dimension passed as numEq to addSizes() - confirm in the implementation
        unsigned int dim_wells = 0;     // NOTE(review): presumably the well block dimension passed as numWellEq to addSizes() - confirm
        unsigned int num_wells = 0;     // value returned by get_num_wells()
        unsigned int num_blocks_so_far = 0;
        unsigned int num_wells_so_far = 0;
        unsigned int *val_pointers = nullptr;     // val_pointers[wellID] == index of first block for this well in Ccols and Bcols
        bool allocated = false;

#if HAVE_CUDA
        // Counterparts of the buffers below, prefixed d_
        // NOTE(review): presumably device-side copies managed by alloc_gpu()/free_gpu() - confirm
        double *d_Cnnzs = nullptr;
        double *d_Dnnzs = nullptr;
        double *d_Bnnzs = nullptr;
        int *d_Ccols = nullptr;
        int *d_Bcols = nullptr;
        double *d_z1 = nullptr;
        double *d_z2 = nullptr;
        unsigned int *d_val_pointers = nullptr;
        cudaStream_t stream = nullptr;       // null handle until setCudaStream() is called, instead of an indeterminate value
#endif

        double *Cnnzs = nullptr;
        double *Dnnzs = nullptr;
        double *Bnnzs = nullptr;
        int *Ccols = nullptr;
        int *Dcols = nullptr;
        int *Bcols = nullptr;
        double *z1 = nullptr;                // z1 = B * x
        double *z2 = nullptr;                // z2 = D^-1 * B * x

        /// Apply the WellContributions on CPU
        void apply_cpu(double *x, double *y);

        /// Allocate memory on the CPU
        void alloc_cpu();

        /// Free memory on the CPU
        void free_cpu();

        /// Same as addMatrix(), stores matrix on CPU
        void addMatrix_cpu(int idx, int *colIndices, double *values, unsigned int val_size);

#if HAVE_CUDA
        /// Apply all wellcontributions on GPU, performs y -= C^T * (D^-1 * (B * x))
        /// Kernel is asynchronous
        void apply_gpu(double *d_x, double *d_y);

        /// Allocate memory on the GPU
        void alloc_gpu();

        /// Free memory on the GPU
        void free_gpu();

        /// Same as addMatrix(), stores matrix on GPU
        void addMatrix_gpu(int idx, int *colIndices, double *values, unsigned int val_size);
#endif

    public:
#if HAVE_CUDA
        /// Set a cudaStream to be used
        /// \param[in] stream           the cudaStream that is used to launch the kernel in
        void setCudaStream(cudaStream_t stream);
#endif

        /// Create a new, empty WellContributions: all counters are zero and all buffer pointers are null
        WellContributions() = default;

        /// Copying is disabled: the destructor frees the buffers this object points to,
        /// so a member-wise copy would free them twice. Pass the object by reference or pointer instead.
        WellContributions(const WellContributions&) = delete;
        WellContributions& operator=(const WellContributions&) = delete;

        /// Destroy a WellContributions, and free memory
        ~WellContributions();

        /// Apply all wellcontributions in this object
        void apply(double *x, double *y);

        /// Allocate memory for the wellcontributions
        void alloc_all();

        /// Indicate how large the next wellcontributions are, this function cannot be called after alloc_all() is called
        void addSizes(unsigned int nnz, unsigned int numEq, unsigned int numWellEq);

        /// Store a matrix in this object, in blocked csr format
        void addMatrix(int idx, int *colIndices, double *values, unsigned int val_size);

        /// Return the number of wells added to this object
        /// \return the current value of num_wells
        unsigned int get_num_wells() const {
            return num_wells;
        }

        /// WellContributions can be applied on CPU or GPU
        /// This function sets the static variable, so each WellContributions is applied on the correct hardware
        static void setMode(bool use_gpu);

    };

} //namespace Opm

#endif
cusparseSolver can now apply wellcontributions separately, so --matrix-add-well-contributions=true is not required anymore 2020-03-13 08:21:59 -05:00			`/*`
			`Copyright 2019 Equinor ASA`

			`This file is part of the Open Porous Media project (OPM).`

			`OPM is free software: you can redistribute it and/or modify`
			`it under the terms of the GNU General Public License as published by`
			`the Free Software Foundation, either version 3 of the License, or`
			`(at your option) any later version.`

			`OPM is distributed in the hope that it will be useful,`
			`but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`GNU General Public License for more details.`

			`You should have received a copy of the GNU General Public License`
			`along with OPM. If not, see <http://www.gnu.org/licenses/>.`
			`*/`

			`#ifndef WellContributions_H`
			`#define WellContributions_H`

			`#include <vector>`

			`#if HAVE_CUDA`
			`#include <cuda_runtime.h>`
			`#endif`

			`#include <config.h>`

			`namespace Opm`
			`{`

			`/// This class serves to eliminate the need to include the WellContributions into the matrix (with --matrix-add-well-contributions=true) for the cusparseSolver`
			`/// If the --matrix-add-well-contributions commandline parameter is true, this class should not be used`
			`class WellContributions`
			`{`

			`private:`
			`static bool gpu_mode; // gpu_mode should be initialized in the ISTLSolverEbos constructor, and its value must not change afterwards`
			`unsigned int num_blocks = 0; // total number of blocks in all wells`
			`unsigned int dim;`
			`unsigned int dim_wells;`
			`unsigned int num_wells = 0;`
			`unsigned int num_blocks_so_far = 0;`
			`unsigned int num_wells_so_far = 0;`
			`unsigned int *val_pointers = nullptr; // val_pointers[wellID] == index of first block for this well in Ccols and Bcols`
			`bool allocated = false;`

			`#if HAVE_CUDA`
			`double *d_Cnnzs = nullptr;`
			`double *d_Dnnzs = nullptr;`
			`double *d_Bnnzs = nullptr;`
			`int *d_Ccols = nullptr;`
			`int *d_Bcols = nullptr;`
			`double *d_z1 = nullptr;`
			`double *d_z2 = nullptr;`
			`unsigned int *d_val_pointers = nullptr;`
			`cudaStream_t stream;`
			`#endif`

			`double *Cnnzs = nullptr;`
			`double *Dnnzs = nullptr;`
			`double *Bnnzs = nullptr;`
			`int *Ccols = nullptr;`
			`int *Dcols = nullptr;`
			`int *Bcols = nullptr;`
			`double *z1 = nullptr; // z1 = B * x`
			`double *z2 = nullptr; // z2 = D^-1 * B * x`

			`/// Apply the WellContributions on CPU`
			`void apply_cpu(double *x, double *y);`

			`/// Allocate memory on the CPU`
			`void alloc_cpu();`

			`/// Free memory on the CPU`
			`void free_cpu();`

			`/// Same as addMatrix(), stores matrix on CPU`
			`void addMatrix_cpu(int idx, int *colIndices, double *values, unsigned int val_size);`

			`#if HAVE_CUDA`
			`/// Apply all wellcontributions on GPU, performs y -= C^T * (D^-1 * (B * x))`
			`/// Kernel is asynchronous`
			`void apply_gpu(double *d_x, double *d_y);`

			`/// Allocate memory on the GPU`
			`void alloc_gpu();`

			`/// Free memory on the GPU`
			`void free_gpu();`

			`/// Same as addMatrix(), stores matrix on GPU`
			`void addMatrix_gpu(int idx, int *colIndices, double *values, unsigned int val_size);`
			`#endif`

			`public:`
			`#if HAVE_CUDA`
			`/// Set a cudaStream to be used`
			`/// \param[in] stream the cudaStream that is used to launch the kernel in`
			`void setCudaStream(cudaStream_t stream);`
			`#endif`

			`/// Create a new WellContributions, implementation is empty`
			`WellContributions(){};`

			`/// Destroy a WellContributions, and free memory`
			`~WellContributions();`

			`/// Apply all wellcontributions in this object`
			`void apply(double *x, double *y);`

			`/// Allocate memory for the wellcontributions`
			`void alloc_all();`

			`/// Indicate how large the next wellcontributions are, this function cannot be called after alloc_all() is called`
			`void addSizes(unsigned int nnz, unsigned int numEq, unsigned int numWellEq);`

			`/// Store a matrix in this object, in blocked csr format`
			`void addMatrix(int idx, int *colIndices, double *values, unsigned int val_size);`

			`/// Return the number of wells added to this object`
			`unsigned int get_num_wells(){`
			`return num_wells;`
			`}`

			`/// WellContributions can be applied on CPU or GPU`
			`/// This function sets the static variable, so each WellContributions is applied on the correct hardware`
			`static void setMode(bool use_gpu);`

			`};`

			`} //namespace Opm`

			`#endif`