2019-12-03 07:10:21 -06:00
/*
2019-12-05 07:24:37 -06:00
Copyright 2019 Equinor ASA
2019-12-03 07:10:21 -06:00
This file is part of the Open Porous Media project ( OPM ) .
OPM is free software : you can redistribute it and / or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation , either version 3 of the License , or
( at your option ) any later version .
OPM is distributed in the hope that it will be useful ,
but WITHOUT ANY WARRANTY ; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
GNU General Public License for more details .
You should have received a copy of the GNU General Public License
along with OPM . If not , see < http : //www.gnu.org/licenses/>.
*/
# include <config.h>
2019-12-06 04:05:41 -06:00
# include <opm/common/OpmLog/OpmLog.hpp>
2019-12-18 08:47:35 -06:00
# include <opm/common/ErrorMacros.hpp>
2019-12-06 04:27:17 -06:00
# include <opm/material/common/Unused.hpp>
2019-12-06 04:05:41 -06:00
2019-12-04 09:59:58 -06:00
# include <opm/simulators/linalg/bda/BdaBridge.hpp>
# include <opm/simulators/linalg/bda/BdaResult.hpp>
2019-12-03 07:10:21 -06:00
2021-02-23 05:31:09 -06:00
# if HAVE_CUDA
# include <opm/simulators/linalg/bda/cusparseSolverBackend.hpp>
# endif
# if HAVE_OPENCL
# include <opm/simulators/linalg/bda/openclSolverBackend.hpp>
# endif
# if HAVE_FPGA
# include <opm/simulators/linalg/bda/FPGASolverBackend.hpp>
# endif
2019-12-06 04:27:17 -06:00
# define PRINT_TIMERS_BRIDGE 0
2019-12-03 07:10:21 -06:00
// Shorthand so the Dune result type can be named without its namespace in this file.
using InverseOperatorResult = Dune::InverseOperatorResult;
namespace Opm
{
2020-06-22 11:26:49 -05:00
using bda : : BdaResult ;
using bda : : BdaSolver ;
2020-07-02 05:11:42 -05:00
using bda : : SolverStatus ;
2020-10-16 08:05:02 -05:00
using bda : : ILUReorder ;
2020-06-22 11:26:49 -05:00
2020-06-24 09:46:04 -05:00
template < class BridgeMatrix , class BridgeVector , int block_size >
2021-04-19 02:49:20 -05:00
BdaBridge < BridgeMatrix , BridgeVector , block_size > : : BdaBridge ( std : : string accelerator_mode_ ,
[[maybe_unused]] std : : string fpga_bitstream ,
int linear_solver_verbosity , int maxit ,
2021-05-28 09:05:15 -05:00
double tolerance ,
[[maybe_unused]] unsigned int platformID ,
2021-04-19 02:49:20 -05:00
unsigned int deviceID ,
[[maybe_unused]] std : : string opencl_ilu_reorder )
2020-12-22 05:57:01 -06:00
: accelerator_mode ( accelerator_mode_ )
2020-02-13 04:04:02 -06:00
{
2020-12-22 05:57:01 -06:00
if ( accelerator_mode . compare ( " cusparse " ) = = 0 ) {
2020-06-23 11:19:33 -05:00
# if HAVE_CUDA
2020-06-22 11:26:49 -05:00
use_gpu = true ;
2020-07-01 12:43:22 -05:00
backend . reset ( new bda : : cusparseSolverBackend < block_size > ( linear_solver_verbosity , maxit , tolerance , deviceID ) ) ;
2020-06-23 11:19:33 -05:00
# else
OPM_THROW ( std : : logic_error , " Error cusparseSolver was chosen, but CUDA was not found by CMake " ) ;
# endif
2020-12-22 05:57:01 -06:00
} else if ( accelerator_mode . compare ( " opencl " ) = = 0 ) {
2020-06-22 11:26:49 -05:00
# if HAVE_OPENCL
use_gpu = true ;
2020-12-22 05:57:01 -06:00
ILUReorder ilu_reorder ;
if ( opencl_ilu_reorder = = " " ) {
ilu_reorder = bda : : ILUReorder : : GRAPH_COLORING ; // default when not selected by user
} else if ( opencl_ilu_reorder = = " level_scheduling " ) {
2020-10-16 08:05:02 -05:00
ilu_reorder = bda : : ILUReorder : : LEVEL_SCHEDULING ;
} else if ( opencl_ilu_reorder = = " graph_coloring " ) {
ilu_reorder = bda : : ILUReorder : : GRAPH_COLORING ;
2020-12-17 07:49:59 -06:00
} else if ( opencl_ilu_reorder = = " none " ) {
ilu_reorder = bda : : ILUReorder : : NONE ;
2020-10-16 08:05:02 -05:00
} else {
OPM_THROW ( std : : logic_error , " Error invalid argument for --opencl-ilu-reorder, usage: '--opencl-ilu-reorder=[level_scheduling|graph_coloring]' " ) ;
}
backend . reset ( new bda : : openclSolverBackend < block_size > ( linear_solver_verbosity , maxit , tolerance , platformID , deviceID , ilu_reorder ) ) ;
2020-06-22 11:26:49 -05:00
# else
OPM_THROW ( std : : logic_error , " Error openclSolver was chosen, but OpenCL was not found by CMake " ) ;
# endif
2020-12-22 05:57:01 -06:00
} else if ( accelerator_mode . compare ( " fpga " ) = = 0 ) {
# if HAVE_FPGA
use_fpga = true ;
ILUReorder ilu_reorder ;
if ( opencl_ilu_reorder = = " " ) {
ilu_reorder = bda : : ILUReorder : : LEVEL_SCHEDULING ; // default when not selected by user
} else if ( opencl_ilu_reorder = = " level_scheduling " ) {
ilu_reorder = bda : : ILUReorder : : LEVEL_SCHEDULING ;
} else if ( opencl_ilu_reorder = = " graph_coloring " ) {
ilu_reorder = bda : : ILUReorder : : GRAPH_COLORING ;
} else {
OPM_THROW ( std : : logic_error , " Error invalid argument for --opencl-ilu-reorder, usage: '--opencl-ilu-reorder=[level_scheduling|graph_coloring]' " ) ;
}
backend . reset ( new bda : : FpgaSolverBackend < block_size > ( fpga_bitstream , linear_solver_verbosity , maxit , tolerance , ilu_reorder ) ) ;
# else
OPM_THROW ( std : : logic_error , " Error fpgaSolver was chosen, but FPGA was not enabled by CMake " ) ;
# endif
} else if ( accelerator_mode . compare ( " none " ) = = 0 ) {
2020-06-23 11:19:33 -05:00
use_gpu = false ;
2020-12-22 05:57:01 -06:00
use_fpga = false ;
2020-06-23 11:19:33 -05:00
} else {
2020-12-22 05:57:01 -06:00
OPM_THROW ( std : : logic_error , " Error unknown value for parameter 'AcceleratorMode', should be passed like '--accelerator-mode=[none|cusparse|opencl|fpga] " ) ;
2019-12-18 08:50:09 -06:00
}
2019-12-03 07:10:21 -06:00
}
2019-12-16 03:05:12 -06:00
2019-12-18 08:47:35 -06:00
2019-12-03 07:10:21 -06:00
/// Replace exact zeros on the main diagonal of every diagonal block by a tiny value.
///
/// For each row the block in column == row is looked up and every entry [i][i] of that
/// block that compares equal to 0.0 is overwritten with 1e-15.
///
/// The offset of the diagonal block inside each row is cached in a function-local static
/// vector, so there is one cache per BridgeMatrix type, shared by all matrices of that type.
/// The cache is rebuilt whenever its length differs from the number of rows of \p mat;
/// a matrix with the same number of rows but a different sparsity pattern is NOT detected.
///
/// \param[in,out] mat  block matrix whose diagonal blocks are patched in place
/// \return number of diagonal entries that were replaced
///
/// \note A row without a diagonal block is only caught by the assert below,
///       i.e. not at all when asserts are compiled out.
template <class BridgeMatrix>
int checkZeroDiagonal(BridgeMatrix& mat) {
    static std::vector<typename BridgeMatrix::size_type> diag_indices;   // per row: offset of the diagonal block within that row
    // use the block dimension of the matrix type instead of assuming 3x3 blocks
    const int dim = static_cast<int>(BridgeMatrix::block_type::rows);
    const double zero_replace = 1e-15;
    int numZeros = 0;

    // patches one diagonal block, returns how many of its diagonal entries were replaced
    const auto patchBlock = [&](auto& block) {
        int replaced = 0;
        for (int rr = 0; rr < dim; ++rr) {
            auto& val = block[rr][rr];   // reference to easily change the value
            if (val == 0.0) {            // could be replaced by '< 1e-30' or similar
                val = zero_replace;
                ++replaced;
            }
        }
        return replaced;
    };

    if (diag_indices.size() != static_cast<typename BridgeMatrix::size_type>(mat.N())) {
        // first call, or a matrix with a different number of rows: (re)build the offset cache
        diag_indices.clear();
        diag_indices.reserve(mat.N());
        for (typename BridgeMatrix::iterator r = mat.begin(); r != mat.end(); ++r) {
            auto diag = r->find(r.index());   // diag is an iterator
            assert(diag.index() == r.index());
            numZeros += patchBlock(*diag);
            diag_indices.emplace_back(diag.offset());
        }
    } else {
        // cached path: jump straight to the diagonal block of every row
        for (typename BridgeMatrix::iterator r = mat.begin(); r != mat.end(); ++r) {
            typename BridgeMatrix::size_type offset = diag_indices[r.index()];
            auto& diag_block = r->getptr()[offset];   // reference to the block located on column r of row r
            numZeros += patchBlock(diag_block);
        }
    }

    return numZeros;
}
2019-12-06 07:33:52 -06:00
// iterate sparsity pattern from Matrix and put colIndices and rowPointers in arrays
2021-03-04 04:49:29 -06:00
// sparsity pattern should stay the same
2019-12-18 08:47:35 -06:00
// this could be removed if Dune::BCRSMatrix features an API call that returns colIndices and rowPointers
2019-12-03 07:10:21 -06:00
template < class BridgeMatrix >
2019-12-06 10:23:32 -06:00
void getSparsityPattern ( BridgeMatrix & mat , std : : vector < int > & h_rows , std : : vector < int > & h_cols ) {
2019-12-18 08:50:09 -06:00
int sum_nnzs = 0 ;
// convert colIndices and rowPointers
2019-12-18 08:54:14 -06:00
if ( h_rows . size ( ) = = 0 ) {
2019-12-18 08:50:09 -06:00
h_rows . emplace_back ( 0 ) ;
2019-12-18 08:54:14 -06:00
for ( typename BridgeMatrix : : const_iterator r = mat . begin ( ) ; r ! = mat . end ( ) ; + + r ) {
2019-12-18 08:50:09 -06:00
int size_row = 0 ;
2019-12-18 08:54:14 -06:00
for ( auto c = r - > begin ( ) ; c ! = r - > end ( ) ; + + c ) {
2019-12-18 08:50:09 -06:00
h_cols . emplace_back ( c . index ( ) ) ;
size_row + + ;
}
sum_nnzs + = size_row ;
h_rows . emplace_back ( sum_nnzs ) ;
}
2019-12-18 09:37:29 -06:00
// h_rows and h_cols could be changed to 'unsigned int', but cusparse expects 'int'
if ( static_cast < unsigned int > ( h_rows [ mat . N ( ) ] ) ! = mat . nonzeroes ( ) ) {
2019-12-18 08:50:09 -06:00
OPM_THROW ( std : : logic_error , " Error size of rows do not sum to number of nonzeroes in BdaBridge::getSparsityPattern() " ) ;
}
}
2019-12-06 07:33:52 -06:00
} // end getSparsityPattern()
2019-12-03 07:10:21 -06:00
2020-06-24 09:46:04 -05:00
/// Hand the linear system to the accelerator backend and report the outcome in \p res.
///
/// When neither use_gpu nor use_fpga is set, only res.converged is set to false.
/// Otherwise the sparsity pattern is extracted once into function-local static arrays
/// (so they are shared by all bridges of the same template instantiation), zeros on the
/// block diagonals are patched by checkZeroDiagonal(), and backend->solve_system() is called
/// with raw pointers to the matrix values and to \p b.
///
/// Only 3x3 blocks are accepted. For any other block dimension both accelerator flags are
/// cleared, res.converged is set to false and the function returns without calling the backend.
///
/// \param[in,out] mat           block matrix; read via (*mat)[0][0], so it is assumed to be non-empty
///                              whenever an accelerator is active
/// \param[in]     b             right-hand side, passed to the backend as a pointer to b[0][0]
/// \param[in,out] wellContribs  passed through to the backend
/// \param[out]    res           receives iterations, reduction, converged, conv_rate and elapsed
///                              from the backend result
template <class BridgeMatrix, class BridgeVector, int block_size>
void BdaBridge<BridgeMatrix, BridgeVector, block_size>::solve_system(BridgeMatrix *mat OPM_UNUSED, BridgeVector &b OPM_UNUSED, WellContributions& wellContribs OPM_UNUSED, InverseOperatorResult &res OPM_UNUSED)
{
    if (use_gpu || use_fpga) {
        BdaResult result;
        result.converged = false;
        static std::vector<int> h_rows;
        static std::vector<int> h_cols;
        const int dim = (*mat)[0][0].N();
        const int Nb = mat->N();
        const int N = Nb * dim;
        // once the pattern has been extracted, the last row pointer is the number of blocks
        const int nnzb = (h_rows.empty()) ? mat->nonzeroes() : h_rows.back();
        const int nnz = nnzb * dim * dim;

        if (dim != 3) {
            OpmLog::warning(" BdaSolver only accepts blocksize = 3 at this time, will use Dune for the remainder of the program ");
            // disable every accelerator path, otherwise an FPGA bridge would re-enter here on each call
            use_gpu = use_fpga = false;
            // nothing was solved: make sure the caller does not see a stale 'converged'
            res.converged = false;
            return;
        }

        if (h_rows.capacity() == 0) {
            h_rows.reserve(Nb + 1);
            h_cols.reserve(nnzb);
#if PRINT_TIMERS_BRIDGE
            Dune::Timer t;
#endif
            getSparsityPattern(*mat, h_rows, h_cols);
#if PRINT_TIMERS_BRIDGE
            std::ostringstream out;
            out << " getSparsityPattern() took: " << t.stop() << " s ";
            OpmLog::info(out.str());
#endif
        }

#if PRINT_TIMERS_BRIDGE
        Dune::Timer t_zeros;
        int numZeros = checkZeroDiagonal(*mat);
        std::ostringstream out;
        out << " Checking zeros took: " << t_zeros.stop() << " s, found " << numZeros << " zeros ";
        OpmLog::info(out.str());
#else
        checkZeroDiagonal(*mat);
#endif

        /////////////////////////
        // actually solve

        // assume that underlying data (nonzeroes) from mat (Dune::BCRSMatrix) are contiguous, if this is not the case, cusparseSolver is expected to perform undefined behaviour
        SolverStatus status = backend->solve_system(N, nnz, dim, static_cast<double*>(&(((*mat)[0][0][0][0]))), h_rows.data(), h_cols.data(), static_cast<double*>(&(b[0][0])), wellContribs, result);
        switch (status) {
        case SolverStatus::BDA_SOLVER_SUCCESS:
            //OpmLog::info("BdaSolver converged");
            break;
        case SolverStatus::BDA_SOLVER_ANALYSIS_FAILED:
            OpmLog::warning(" BdaSolver could not analyse level information of matrix, perhaps there is still a 0.0 on the diagonal of a block on the diagonal ");
            break;
        case SolverStatus::BDA_SOLVER_CREATE_PRECONDITIONER_FAILED:
            OpmLog::warning(" BdaSolver could not create preconditioner, perhaps there is still a 0.0 on the diagonal of a block on the diagonal ");
            break;
        default:
            OpmLog::warning(" BdaSolver returned unknown status code ");
        }

        // copy the backend result into the Dune result structure
        res.iterations = result.iterations;
        res.reduction = result.reduction;
        res.converged = result.converged;
        res.conv_rate = result.conv_rate;
        res.elapsed = result.elapsed;
    } else {
        res.converged = false;
    }
}
2020-06-24 09:46:04 -05:00
/// Ask the backend to write its result into \p x.
///
/// Does nothing unless use_gpu or use_fpga is set; otherwise backend->get_result()
/// is called with a pointer to the first scalar of \p x.
///
/// \param[out] x  block vector whose storage starting at x[0][0] is handed to the backend
template <class BridgeMatrix, class BridgeVector, int block_size>
void BdaBridge<BridgeMatrix, BridgeVector, block_size>::get_result(BridgeVector &x OPM_UNUSED) {
    const bool acceleratorActive = use_gpu || use_fpga;
    if (!acceleratorActive) {
        return;
    }

    double* const firstEntry = static_cast<double*>(&(x[0][0]));
    backend->get_result(firstEntry);
}
2021-02-23 05:31:09 -06:00
template < class BridgeMatrix , class BridgeVector , int block_size >
2021-05-28 09:05:15 -05:00
void BdaBridge < BridgeMatrix , BridgeVector , block_size > : : initWellContributions ( [[maybe_unused]] WellContributions & wellContribs ) {
2020-12-22 05:57:01 -06:00
if ( accelerator_mode . compare ( " opencl " ) = = 0 ) {
2021-02-23 05:31:09 -06:00
# if HAVE_OPENCL
const auto openclBackend = static_cast < const bda : : openclSolverBackend < block_size > * > ( backend . get ( ) ) ;
wellContribs . setOpenCLEnv ( openclBackend - > context . get ( ) , openclBackend - > queue . get ( ) ) ;
# else
OPM_THROW ( std : : logic_error , " Error openclSolver was chosen, but OpenCL was not found by CMake " ) ;
# endif
}
}
2021-06-01 06:50:27 -05:00
// Explicit instantiations of BdaBridge for block sizes 1 to 4, once per block type.
// the tests use Dune::FieldMatrix, Flow uses Opm::MatrixBlock

// instantiates BdaBridge for one block type BLOCK and one block size n
#define INSTANTIATE_BDA_BRIDGE(BLOCK, n)                                                                        \
    template class BdaBridge<Dune::BCRSMatrix<BLOCK<double, n, n>, std::allocator<BLOCK<double, n, n> > >,      \
    Dune::BlockVector<Dune::FieldVector<double, n>, std::allocator<Dune::FieldVector<double, n> > >,            \
    n>

// instantiates BdaBridge for both block types; the terminating ';' comes from the point of use
#define INSTANTIATE_BDA_FUNCTIONS(n)                \
    INSTANTIATE_BDA_BRIDGE(Opm::MatrixBlock, n);    \
    INSTANTIATE_BDA_BRIDGE(Dune::FieldMatrix, n)

INSTANTIATE_BDA_FUNCTIONS(1);
INSTANTIATE_BDA_FUNCTIONS(2);
INSTANTIATE_BDA_FUNCTIONS(3);
INSTANTIATE_BDA_FUNCTIONS(4);

#undef INSTANTIATE_BDA_FUNCTIONS
#undef INSTANTIATE_BDA_BRIDGE
2019-12-03 07:10:21 -06:00
2020-06-24 13:09:14 -05:00
} // namespace Opm
2019-12-03 07:10:21 -06:00