/*
Copyright 2020 Equinor ASA
This file is part of the Open Porous Media project (OPM).
OPM is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
OPM is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with OPM. If not, see .
*/
#ifndef FPGA_MATRIX_HEADER_INCLUDED
#define FPGA_MATRIX_HEADER_INCLUDED
#include
namespace bda
{
/// This struct resembles a csr matrix, only doubles are supported
/// The data is stored in contiguous memory, such that they can be copied to a device in one transfer.
class Matrix {
public:
/// Allocate Matrix and data arrays with given sizes
/// \param[in] N number of rows
/// \param[in] nnzs number of nonzeros
Matrix(int N_, int nnzs_)
: nnzValues(new double[nnzs_]),
colIndices(new int[nnzs_]),
rowPointers(new int[N_+1]),
N(N_),
nnzs(nnzs_)
{}
/// All constructors allocate new memory, so always delete here
~Matrix(){
delete[] nnzValues;
delete[] colIndices;
delete[] rowPointers;
}
/// Converts this matrix to the dataformat used by the FPGA.
/// The FPGA uses a new data format called CSRO (Compressed Sparse Row Offset).
/// The purpose of this format is to allow the data to be streamable.
/// The rowPointers array has an unpredictable reading pattern/timing,
/// it also needs a extra work if a row is shorter than a cacheline.
/// The array of N+1 rowPointers is replaced by an array of nnz rowOffsets.
/// The value of this offset is 0, unless the corresponding nnz is the first of a row,
/// in that case it is 'the number of empty rows preceeding it + 1'.
/// The FPGA can simply add the rowOffset to the current rowIdx to get the new rowIdx.
/// Example:
/// [1 0 0 3 0] nnzValues [1 3 2 2 1 4 3 4 1]
/// [0 2 2 0 1] colIndices [0 3 1 2 4 0 1 2 4]
/// [4 0 0 0 0] -> rowPointers [0 2 5 6 6 9]
/// [0 0 0 0 0] rowOffsets [1 0 1 0 0 1 2 0 0]
/// [0 3 4 0 1]
/// The rowOffset is stored in 1 byte, meaning the maximum value is 255.
int toRDF(int numColors, std::vector& nodesPerColor,
std::vector >& colIndicesInColor, int nnzsPerRowLimit,
std::vector >& ubNnzValues, short int *ubColIndices, int *nnzValsSizes, unsigned char *NROffsets, int *colorSizes);
double *nnzValues;
int *colIndices;
int *rowPointers;
int N;
int nnzs;
};
void sortRow(int *colIndices, double *data, int left, int right);
} // end namespace bda
#endif // FPGA_MATRIX_HEADER_INCLUDED