From 1f6d957cd4a518af7d3f881a7f734bd305d6b586 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Atgeirr=20Fl=C3=B8=20Rasmussen?= <atgeirr@sintef.no>
Date: Wed, 9 Sep 2015 10:22:25 +0200
Subject: [PATCH 1/4] Change the way the interleaved matrix is built.

Note that this implementation may not be robust since the getSparse()
method throws if the AutoDiffMatrix is not of general sparse type (S),
---
 opm/autodiff/AutoDiffMatrix.hpp               |  8 +++++++
 .../NewtonIterationBlackoilInterleaved.cpp    | 23 +++++++++++++++----
 2 files changed, 26 insertions(+), 5 deletions(-)
diff --git a/opm/autodiff/AutoDiffMatrix.hpp b/opm/autodiff/AutoDiffMatrix.hpp
index 18f86d624..9d0347c92 100644
--- a/opm/autodiff/AutoDiffMatrix.hpp
+++ b/opm/autodiff/AutoDiffMatrix.hpp
@@ -529,6 +529,14 @@ namespace Opm
             }
         }
 
+
+        const Sparse& getSparse() const {
+            if (type_ != S) {
+                OPM_THROW(std::logic_error, "Must not call getSparse() for non-sparse type.");
+            }
+            return sparse_;
+        }
+
     private:
         enum MatrixType { Z, I, D, S };
         MatrixType type_;
diff --git a/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp b/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
index 298136521..b5fb4349d 100644
--- a/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
+++ b/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
@@ -233,17 +233,30 @@ namespace Opm
             }
         }
 
+        // Set all blocks to zero.
         const int size = s.rows();
+        assert(size == s.cols());
         for (int row = 0; row < size; ++row) {
             for (int col_ix = ia[row]; col_ix < ia[row + 1]; ++col_ix) {
                 const int col = ja[col_ix];
-                MatrixBlockType block;
-                for (int p1 = 0; p1 < np; ++p1) {
-                    for (int p2 = 0; p2 < np; ++p2) {
-                        block[p1][p2] = eqs[p1].derivative()[p2].coeff(row, col);
+                istlA[row][col] = 0.0;
+            }
+        }
+
+        // Go through all jacobians, insert in correct spot
+        for (int col = 0; col < size; ++col) {
+            for (int p1 = 0; p1 < np; ++p1) {
+                for (int p2 = 0; p2 < np; ++p2) {
+                    // Note that that since these are CSC and not CSR matrices,
+                    // ja contains row numbers instead of column numbers.
+                    const int* ia = eqs[p1].derivative()[p2].getSparse().outerIndexPtr();
+                    const int* ja = eqs[p1].derivative()[p2].getSparse().innerIndexPtr();
+                    const double* sa = eqs[p1].derivative()[p2].getSparse().valuePtr();
+                    for (int elem_ix = ia[col]; elem_ix < ia[col + 1]; ++elem_ix) {
+                        const int row = ja[elem_ix];
+                        istlA[row][col][p1][p2] = sa[elem_ix];
                     }
                 }
-                istlA[row][col] = block;
             }
         }
     }

From a58dcce654e744299a37698cdb0826e75c343d7c Mon Sep 17 00:00:00 2001
From: babrodtk <andre.brodtkorb@sintef.no>
Date: Thu, 17 Sep 2015 13:46:05 +0200
Subject: [PATCH 2/4] Minor changes to how the interleaved system is built

---
 opm/autodiff/AutoDiffMatrix.hpp               | 202 +++++++++---------
 .../NewtonIterationBlackoilInterleaved.cpp    |  45 ++--
 2 files changed, 132 insertions(+), 115 deletions(-)

diff --git a/opm/autodiff/AutoDiffMatrix.hpp b/opm/autodiff/AutoDiffMatrix.hpp
index 9d0347c92..8b1a5b88d 100644
--- a/opm/autodiff/AutoDiffMatrix.hpp
+++ b/opm/autodiff/AutoDiffMatrix.hpp
@@ -38,11 +38,12 @@ namespace Opm
     class AutoDiffMatrix
     {
     public:
-        typedef std::vector<double> Diag;
-        typedef Eigen::SparseMatrix<double> Sparse;
+        typedef std::vector<double> DiagRep;
+        typedef Eigen::SparseMatrix<double> SparseRep;
+
 
         AutoDiffMatrix()
-            : type_(Z),
+            : type_(Zero),
               rows_(0),
               cols_(0),
               diag_(),
@@ -53,7 +54,7 @@ namespace Opm
 
 
         AutoDiffMatrix(const int num_rows, const int num_cols)
-            : type_(Z),
+            : type_(Zero),
               rows_(num_rows),
               cols_(num_cols),
               diag_(),
@@ -67,7 +68,7 @@ namespace Opm
 
 
         AutoDiffMatrix(const CreationType t, const int num_rows)
-            : type_(t == ZeroMatrix ? Z : I),
+            : type_(t == ZeroMatrix ? Zero : Identity),
               rows_(num_rows),
               cols_(num_rows),
               diag_(),
@@ -78,7 +79,7 @@ namespace Opm
 
 
         explicit AutoDiffMatrix(const Eigen::DiagonalMatrix<double, Eigen::Dynamic>& d)
-            : type_(D),
+            : type_(Diagonal),
               rows_(d.rows()),
               cols_(d.cols()),
               diag_(d.diagonal().array().data(), d.diagonal().array().data() + d.rows()),
@@ -90,7 +91,7 @@ namespace Opm
 
 
         explicit AutoDiffMatrix(const Eigen::SparseMatrix<double>& s)
-            : type_(S),
+            : type_(Sparse),
               rows_(s.rows()),
               cols_(s.cols()),
               diag_(),
@@ -106,7 +107,7 @@ namespace Opm
 
 
         AutoDiffMatrix(AutoDiffMatrix&& other)
-            : type_(Z),
+            : type_(Zero),
               rows_(0),
               cols_(0),
               diag_(),
@@ -141,43 +142,43 @@ namespace Opm
             assert(rows_ == rhs.rows_);
             assert(cols_ == rhs.cols_);
             switch (type_) {
-            case Z:
+            case Zero:
                 return rhs;
-            case I:
+            case Identity:
                 switch (rhs.type_) {
-                case Z:
+                case Zero:
                     return *this;
-                case I:
+                case Identity:
                     return addII(*this, rhs);
-                case D:
+                case Diagonal:
                     return addDI(rhs, *this);
-                case S:
+                case Sparse:
                     return addSI(rhs, *this);
                 default:
                     OPM_THROW(std::logic_error, "Invalid AutoDiffMatrix type encountered: " << rhs.type_);
                 }
-            case D:
+            case Diagonal:
                 switch (rhs.type_) {
-                case Z:
+                case Zero:
                     return *this;
-                case I:
+                case Identity:
                     return addDI(*this, rhs);
-                case D:
+                case Diagonal:
                     return addDD(*this, rhs);
-                case S:
+                case Sparse:
                     return addSD(rhs, *this);
                 default:
                     OPM_THROW(std::logic_error, "Invalid AutoDiffMatrix type encountered: " << rhs.type_);
                 }
-            case S:
+            case Sparse:
                 switch (rhs.type_) {
-                case Z:
+                case Zero:
                     return *this;
-                case I:
+                case Identity:
                     return addSI(*this, rhs);
-                case D:
+                case Diagonal:
                     return addSD(*this, rhs);
-                case S:
+                case Sparse:
                     return addSS(*this, rhs);
                 default:
                     OPM_THROW(std::logic_error, "Invalid AutoDiffMatrix type encountered: " << rhs.type_);
@@ -191,32 +192,32 @@ namespace Opm
         {
             assert(cols_ == rhs.rows_);
             switch (type_) {
-            case Z:
+            case Zero:
                 return AutoDiffMatrix(rows_, rhs.cols_);
-            case I:
+            case Identity:
                 return rhs;
-            case D:
+            case Diagonal:
                 switch (rhs.type_) {
-                case Z:
+                case Zero:
                     return AutoDiffMatrix(rows_, rhs.cols_);
-                case I:
+                case Identity:
                     return *this;
-                case D:
+                case Diagonal:
                     return mulDD(*this, rhs);
-                case S:
+                case Sparse:
                     return mulDS(*this, rhs);
                 default:
                     OPM_THROW(std::logic_error, "Invalid AutoDiffMatrix type encountered: " << rhs.type_);
                 }
-            case S:
+            case Sparse:
                 switch (rhs.type_) {
-                case Z:
+                case Zero:
                     return AutoDiffMatrix(rows_, rhs.cols_);
-                case I:
+                case Identity:
                     return *this;
-                case D:
+                case Diagonal:
                     return mulSD(*this, rhs);
-                case S:
+                case Sparse:
                     return mulSS(*this, rhs);
                 default:
                     OPM_THROW(std::logic_error, "Invalid AutoDiffMatrix type encountered: " << rhs.type_);
@@ -257,16 +258,16 @@ namespace Opm
         AutoDiffMatrix operator*(const double rhs) const
         {
             switch (type_) {
-            case Z:
+            case Zero:
                 return *this;
-            case I:
+            case Identity:
                 {
                     AutoDiffMatrix retval(*this);
-                    retval.type_ = D;
+                    retval.type_ = Diagonal;
                     retval.diag_.assign(rows_, rhs);
                     return retval;
                 }
-            case D:
+            case Diagonal:
                 {
                     AutoDiffMatrix retval(*this);
                     for (double& elem : retval.diag_) {
@@ -274,7 +275,7 @@ namespace Opm
                     }
                     return retval;
                 }
-            case S:
+            case Sparse:
                 {
                     AutoDiffMatrix retval(*this);
                     retval.sparse_ *= rhs;
@@ -293,16 +294,16 @@ namespace Opm
         AutoDiffMatrix operator/(const double rhs) const
         {
             switch (type_) {
-            case Z:
+            case Zero:
                 return *this;
-            case I:
+            case Identity:
                 {
                     AutoDiffMatrix retval(*this);
-                    retval.type_ = D;
+                    retval.type_ = Diagonal;
                     retval.diag_.assign(rows_, 1.0/rhs);
                     return retval;
                 }
-            case D:
+            case Diagonal:
                 {
                     AutoDiffMatrix retval(*this);
                     for (double& elem : retval.diag_) {
@@ -310,7 +311,7 @@ namespace Opm
                     }
                     return retval;
                 }
-            case S:
+            case Sparse:
                 {
                     AutoDiffMatrix retval(*this);
                     retval.sparse_ /= rhs;
@@ -330,16 +331,16 @@ namespace Opm
         {
             assert(cols_ == rhs.size());
             switch (type_) {
-            case Z:
+            case Zero:
                 return Eigen::VectorXd::Zero(rows_);
-            case I:
+            case Identity:
                 return rhs;
-            case D:
+            case Diagonal:
                 {
                     const Eigen::VectorXd d = Eigen::Map<const Eigen::VectorXd>(diag_.data(), rows_);
                     return d.cwiseProduct(rhs);
                 }
-            case S:
+            case Sparse:
                 return sparse_ * rhs;
             default:
                 OPM_THROW(std::logic_error, "Invalid AutoDiffMatrix type encountered: " << type_);
@@ -353,10 +354,10 @@ namespace Opm
 
         static AutoDiffMatrix addII(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
-            assert(lhs.type_ == I);
-            assert(rhs.type_ == I);
+            assert(lhs.type_ == Identity);
+            assert(rhs.type_ == Identity);
             AutoDiffMatrix retval;
-            retval.type_ = D;
+            retval.type_ = Diagonal;
             retval.rows_ = lhs.rows_;
             retval.cols_ = rhs.cols_;
             retval.diag_.assign(lhs.rows_, 2.0);
@@ -366,8 +367,8 @@ namespace Opm
         static AutoDiffMatrix addDI(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
             static_cast<void>(rhs); // Silence release-mode warning.
-            assert(lhs.type_ == D);
-            assert(rhs.type_ == I);
+            assert(lhs.type_ == Diagonal);
+            assert(rhs.type_ == Identity);
             AutoDiffMatrix retval = lhs;
             for (int r = 0; r < lhs.rows_; ++r) {
                 retval.diag_[r] += 1.0;
@@ -377,8 +378,8 @@ namespace Opm
 
         static AutoDiffMatrix addDD(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
-            assert(lhs.type_ == D);
-            assert(rhs.type_ == D);
+            assert(lhs.type_ == Diagonal);
+            assert(rhs.type_ == Diagonal);
             AutoDiffMatrix retval = lhs;
             for (int r = 0; r < lhs.rows_; ++r) {
                 retval.diag_[r] += rhs.diag_[r];
@@ -389,8 +390,8 @@ namespace Opm
         static AutoDiffMatrix addSI(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
             static_cast<void>(rhs); // Silence release-mode warning.
-            assert(lhs.type_ == S);
-            assert(rhs.type_ == I);
+            assert(lhs.type_ == Sparse);
+            assert(rhs.type_ == Identity);
             AutoDiffMatrix retval = lhs;
             retval.sparse_ += spdiag(Eigen::VectorXd::Ones(lhs.rows_));;
             return retval;
@@ -398,8 +399,8 @@ namespace Opm
 
         static AutoDiffMatrix addSD(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
-            assert(lhs.type_ == S);
-            assert(rhs.type_ == D);
+            assert(lhs.type_ == Sparse);
+            assert(rhs.type_ == Diagonal);
             AutoDiffMatrix retval = lhs;
             retval.sparse_ += spdiag(rhs.diag_);
             return retval;
@@ -407,8 +408,8 @@ namespace Opm
 
         static AutoDiffMatrix addSS(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
-            assert(lhs.type_ == S);
-            assert(rhs.type_ == S);
+            assert(lhs.type_ == Sparse);
+            assert(rhs.type_ == Sparse);
             AutoDiffMatrix retval = lhs;
             retval.sparse_ += rhs.sparse_;
             return retval;
@@ -420,8 +421,8 @@ namespace Opm
 
         static AutoDiffMatrix mulDD(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
-            assert(lhs.type_ == D);
-            assert(rhs.type_ == D);
+            assert(lhs.type_ == Diagonal);
+            assert(rhs.type_ == Diagonal);
             AutoDiffMatrix retval = lhs;
             for (int r = 0; r < lhs.rows_; ++r) {
                 retval.diag_[r] *= rhs.diag_[r];
@@ -431,10 +432,10 @@ namespace Opm
 
         static AutoDiffMatrix mulDS(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
-            assert(lhs.type_ == D);
-            assert(rhs.type_ == S);
+            assert(lhs.type_ == Diagonal);
+            assert(rhs.type_ == Sparse);
             AutoDiffMatrix retval;
-            retval.type_ = S;
+            retval.type_ = Sparse;
             retval.rows_ = lhs.rows_;
             retval.cols_ = rhs.cols_;
             fastDiagSparseProduct(lhs.diag_, rhs.sparse_, retval.sparse_);
@@ -443,10 +444,10 @@ namespace Opm
 
         static AutoDiffMatrix mulSD(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
-            assert(lhs.type_ == S);
-            assert(rhs.type_ == D);
+            assert(lhs.type_ == Sparse);
+            assert(rhs.type_ == Diagonal);
             AutoDiffMatrix retval;
-            retval.type_ = S;
+            retval.type_ = Sparse;
             retval.rows_ = lhs.rows_;
             retval.cols_ = rhs.cols_;
             fastSparseDiagProduct(lhs.sparse_, rhs.diag_, retval.sparse_);
@@ -455,10 +456,10 @@ namespace Opm
 
         static AutoDiffMatrix mulSS(const AutoDiffMatrix& lhs, const AutoDiffMatrix& rhs)
         {
-            assert(lhs.type_ == S);
-            assert(rhs.type_ == S);
+            assert(lhs.type_ == Sparse);
+            assert(rhs.type_ == Sparse);
             AutoDiffMatrix retval;
-            retval.type_ = S;
+            retval.type_ = Sparse;
             retval.rows_ = lhs.rows_;
             retval.cols_ = rhs.cols_;
             fastSparseProduct(lhs.sparse_, rhs.sparse_, retval.sparse_);
@@ -470,16 +471,16 @@ namespace Opm
         void toSparse(Eigen::SparseMatrix<Scalar, Options, Index>& s) const
         {
             switch (type_) {
-            case Z:
+            case Zero:
                 s = Eigen::SparseMatrix<Scalar, Options, Index>(rows_, cols_);
                 return;
-            case I:
+            case Identity:
                 s = spdiag(Eigen::VectorXd::Ones(rows_));
                 return;
-            case D:
+            case Diagonal:
                 s = spdiag(diag_);
                 return;
-            case S:
+            case Sparse:
                 s = sparse_;
                 return;
             }
@@ -499,13 +500,13 @@ namespace Opm
         int nonZeros() const
         {
             switch (type_) {
-            case Z:
+            case Zero:
                 return 0;
-            case I:
+            case Identity:
                 return rows_;
-            case D:
+            case Diagonal:
                 return rows_;
-            case S:
+            case Sparse:
                 return sparse_.nonZeros();
             default:
                 OPM_THROW(std::logic_error, "Invalid AutoDiffMatrix type encountered: " << type_);
@@ -516,44 +517,51 @@ namespace Opm
         double coeff(const int row, const int col) const
         {
             switch (type_) {
-            case Z:
+            case Zero:
                 return 0.0;
-            case I:
+            case Identity:
                 return (row == col) ? 1.0 : 0.0;
-            case D:
+            case Diagonal:
                 return (row == col) ? diag_[row] : 0.0;
-            case S:
+            case Sparse:
                 return sparse_.coeff(row, col);
             default:
                 OPM_THROW(std::logic_error, "Invalid AutoDiffMatrix type encountered: " << type_);
             }
         }
 
-
-        const Sparse& getSparse() const {
-            if (type_ != S) {
-                OPM_THROW(std::logic_error, "Must not call getSparse() for non-sparse type.");
+        const SparseRep& getSparse() const {
+            if (type_ != Sparse) {
+                /**
+                 * If we are not a sparse matrix, our internal variable sparse_
+                 * is undefined, and hence changing it so that it happens to be
+                 * a sparse representation of our true data does not change our
+                 * true data, and hence justifies that we do not really violate
+                 * the const qualifier.
+                 */
+                SparseRep& mutable_sparse = const_cast<SparseRep&>(sparse_);
+                toSparse(mutable_sparse);
             }
             return sparse_;
         }
 
     private:
-        enum MatrixType { Z, I, D, S };
-        MatrixType type_;
+        enum AudoDiffMatrixType { Zero, Identity, Diagonal, Sparse };
+        AudoDiffMatrixType type_;
         int rows_;
         int cols_;
-        Diag diag_;
-        Sparse sparse_;
+        DiagRep diag_;
+        SparseRep sparse_;
 
         template <class V>
         static inline
-        Sparse
+        SparseRep
         spdiag(const V& d)
         {
             const int n = d.size();
-            Sparse mat(n, n);
+            SparseRep mat(n, n);
             mat.reserve(Eigen::ArrayXi::Ones(n, 1));
-            for (Sparse::Index i = 0; i < n; ++i) {
+            for (SparseRep::Index i = 0; i < n; ++i) {
                 if (d[i] != 0.0) {
                     mat.insert(i, i) = d[i];
                 }
diff --git a/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp b/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
index b5fb4349d..c9fc97fc5 100644
--- a/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
+++ b/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
@@ -198,28 +198,38 @@ namespace Opm
 
 
 
+    namespace detail {
+        /**
+         * Simple binary operator that always returns 0.1
+         * It is used to get the sparsity pattern for our
+         * interleaved system, and is marginally faster than using
+         * operator+=.
+         */
+        template<typename Scalar> struct PointOneOp {
+            EIGEN_EMPTY_STRUCT_CTOR(PointOneOp)
+            Scalar operator()(const Scalar& a, const Scalar& b) const { return 0.1; }
+        };
+    }
+
 
     void NewtonIterationBlackoilInterleaved::formInterleavedSystem(const std::vector<ADB>& eqs,
                                                                    Mat& istlA) const
-    {
+   {
         const int np = eqs.size();
-
         // Find sparsity structure as union of basic block sparsity structures,
         // corresponding to the jacobians with respect to pressure.
         // Use addition to get to the union structure.
-        typedef Eigen::SparseMatrix<double> Sp;
-        Sp structure;
-        eqs[0].derivative()[0].toSparse(structure);
-        {
-            Sp s0;
-            for (int phase = 1; phase < np; ++phase) {
-                eqs[phase].derivative()[0].toSparse(s0);
-                structure += s0;
-            }
+        AutoDiffMatrix::SparseRep structure = eqs[0].derivative()[0].getSparse();
+        detail::PointOneOp<double> point_one;
+        for (int phase = 1; phase < np; ++phase) {
+            const AutoDiffMatrix::SparseRep& mat = eqs[phase].derivative()[0].getSparse();
+            structure = structure.binaryExpr(mat, point_one);
         }
-
         Eigen::SparseMatrix<double, Eigen::RowMajor> s = structure;
 
+        const int size = s.rows();
+        assert(size == s.cols());
+
         // Create ISTL matrix with interleaved rows and columns (block structured).
         assert(np == 3);
         istlA.setSize(s.rows(), s.cols(), s.nonZeros());
@@ -227,15 +237,13 @@ namespace Opm
         const int* ia = s.outerIndexPtr();
         const int* ja = s.innerIndexPtr();
         for (Mat::CreateIterator row = istlA.createbegin(); row != istlA.createend(); ++row) {
-            int ri = row.index();
+            const int ri = row.index();
             for (int i = ia[ri]; i < ia[ri + 1]; ++i) {
                 row.insert(ja[i]);
             }
         }
 
         // Set all blocks to zero.
-        const int size = s.rows();
-        assert(size == s.cols());
         for (int row = 0; row < size; ++row) {
             for (int col_ix = ia[row]; col_ix < ia[row + 1]; ++col_ix) {
                 const int col = ja[col_ix];
@@ -249,9 +257,10 @@ namespace Opm
                 for (int p2 = 0; p2 < np; ++p2) {
                     // Note that that since these are CSC and not CSR matrices,
                     // ja contains row numbers instead of column numbers.
-                    const int* ia = eqs[p1].derivative()[p2].getSparse().outerIndexPtr();
-                    const int* ja = eqs[p1].derivative()[p2].getSparse().innerIndexPtr();
-                    const double* sa = eqs[p1].derivative()[p2].getSparse().valuePtr();
+                    const AutoDiffMatrix::SparseRep& s = eqs[p1].derivative()[p2].getSparse();
+                    const int* ia = s.outerIndexPtr();
+                    const int* ja = s.innerIndexPtr();
+                    const double* sa = s.valuePtr();
                     for (int elem_ix = ia[col]; elem_ix < ia[col + 1]; ++elem_ix) {
                         const int row = ja[elem_ix];
                         istlA[row][col][p1][p2] = sa[elem_ix];

From 206dbd3b56e1be72ca7fc3bb65f7b6fb5d85ace2 Mon Sep 17 00:00:00 2001
From: babrodtk <andre.brodtkorb@sintef.no>
Date: Mon, 21 Sep 2015 08:28:57 +0200
Subject: [PATCH 3/4] Updated documentation

---
 .../NewtonIterationBlackoilInterleaved.cpp    | 33 +++++++++++++------
 1 file changed, 23 insertions(+), 10 deletions(-)

diff --git a/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp b/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
index c9fc97fc5..252681e4b 100644
--- a/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
+++ b/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
@@ -218,24 +218,27 @@ namespace Opm
         const int np = eqs.size();
         // Find sparsity structure as union of basic block sparsity structures,
         // corresponding to the jacobians with respect to pressure.
-        // Use addition to get to the union structure.
-        AutoDiffMatrix::SparseRep structure = eqs[0].derivative()[0].getSparse();
+        // Use our custom PointOneOp to get to the union structure.
+        // Note that we only iterate over the pressure derivatives on purpose.
+        Eigen::SparseMatrix<double, Eigen::ColMajor> col_major = eqs[0].derivative()[0].getSparse();
         detail::PointOneOp<double> point_one;
         for (int phase = 1; phase < np; ++phase) {
             const AutoDiffMatrix::SparseRep& mat = eqs[phase].derivative()[0].getSparse();
-            structure = structure.binaryExpr(mat, point_one);
+            col_major = col_major.binaryExpr(mat, point_one);
         }
-        Eigen::SparseMatrix<double, Eigen::RowMajor> s = structure;
 
-        const int size = s.rows();
-        assert(size == s.cols());
+        // Automatically convert the column major structure to a row-major structure
+        Eigen::SparseMatrix<double, Eigen::RowMajor> row_major = col_major;
+
+        const int size = row_major.rows();
+        assert(size == row_major.cols());
 
         // Create ISTL matrix with interleaved rows and columns (block structured).
         assert(np == 3);
-        istlA.setSize(s.rows(), s.cols(), s.nonZeros());
+        istlA.setSize(row_major.rows(), row_major.cols(), row_major.nonZeros());
         istlA.setBuildMode(Mat::row_wise);
-        const int* ia = s.outerIndexPtr();
-        const int* ja = s.innerIndexPtr();
+        const int* ia = row_major.outerIndexPtr();
+        const int* ja = row_major.innerIndexPtr();
         for (Mat::CreateIterator row = istlA.createbegin(); row != istlA.createend(); ++row) {
             const int ri = row.index();
             for (int i = ia[ri]; i < ia[ri + 1]; ++i) {
@@ -251,7 +254,17 @@ namespace Opm
             }
         }
 
-        // Go through all jacobians, insert in correct spot
+        /**
+         * Go through all jacobians, and insert in correct spot
+         *
+         * The straight forward way to do this would be to run through each
+         * element in the output matrix, and set all block entries by gathering
+         * from all "input matrices" (derivatives).
+         *
+         * A faster alternative is to instead run through each "input matrix" and
+         * insert its elements in the correct spot in the output matrix.
+         *
+         */
         for (int col = 0; col < size; ++col) {
             for (int p1 = 0; p1 < np; ++p1) {
                 for (int p2 = 0; p2 < np; ++p2) {

From 85cfd9768eb8959ff00dfcd2c0f84449c7175455 Mon Sep 17 00:00:00 2001
From: babrodtk <andre.brodtkorb@sintef.no>
Date: Thu, 24 Sep 2015 08:47:27 +0200
Subject: [PATCH 4/4] Fixed whitespace issue

---
 opm/autodiff/NewtonIterationBlackoilInterleaved.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp b/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
index 252681e4b..2ef9055fb 100644
--- a/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
+++ b/opm/autodiff/NewtonIterationBlackoilInterleaved.cpp
@@ -214,7 +214,7 @@ namespace Opm
 
     void NewtonIterationBlackoilInterleaved::formInterleavedSystem(const std::vector<ADB>& eqs,
                                                                    Mat& istlA) const
-   {
+    {
         const int np = eqs.size();
         // Find sparsity structure as union of basic block sparsity structures,
         // corresponding to the jacobians with respect to pressure.