GCC Code Coverage Report

Directory:	./
File:	openvdb/openvdb/math/ConjGradient.h
Date:	2022-07-25 17:40:05
	Exec	Total	Coverage
Lines:	361	382	94.5%
Functions:	54	56	96.4%
Branches:	302	631	47.9%
  
      Line
      Branch
      Exec
      Source
    
      // Copyright Contributors to the OpenVDB Project
    
      // SPDX-License-Identifier: MPL-2.0
    
      /// @file    ConjGradient.h
    
      /// @authors D.J. Hill, Peter Cucka
    
      /// @brief   Preconditioned conjugate gradient solver (solves @e Ax = @e b using
    
      ///          the conjugate gradient method with one of a selection of preconditioners)
    
      #ifndef OPENVDB_MATH_CONJGRADIENT_HAS_BEEN_INCLUDED
    
      #define OPENVDB_MATH_CONJGRADIENT_HAS_BEEN_INCLUDED
    
      #include <openvdb/Exceptions.h>
    
      #include <openvdb/Types.h>
    
      #include <openvdb/util/logging.h>
    
      #include <openvdb/util/NullInterrupter.h>
    
      #include "Math.h" // for Abs(), isZero(), Max(), Sqrt()
    
      #include <tbb/parallel_for.h>
    
      #include <tbb/parallel_reduce.h>
    
      #include <algorithm> // for std::lower_bound()
    
      #include <cassert>
    
      #include <cmath> // for std::isfinite()
    
      #include <limits>
    
      #include <sstream>
    
      #include <string>
    
      namespace openvdb {
    
      OPENVDB_USE_VERSION_NAMESPACE
    
      namespace OPENVDB_VERSION_NAME {
    
      namespace math {
    
      namespace pcg {
    
      using SizeType = Index32;
    
      using SizeRange = tbb::blocked_range<SizeType>;
    
      template<typename ValueType> class Vector;
    
      template<typename ValueType, SizeType STENCIL_SIZE> class SparseStencilMatrix;
    
      template<typename ValueType> class Preconditioner;
    
      template<typename MatrixType> class JacobiPreconditioner;
    
      template<typename MatrixType> class IncompleteCholeskyPreconditioner;
    
      /// Information about the state of a conjugate gradient solution
      ///
      /// @details A State object is both returned by solve() and accepted by it
      /// as its set of termination conditions (see the @a termination parameter).
    
      struct State {
    
          /// Outcome flag; ignored when this object is used as termination conditions.
          /// When @c true, the stream insertion operator prints "succeeded with ".
          bool    success;
    
          /// As a termination condition: the maximum number of iterations,
          /// with or without convergence.
          int     iterations;
    
          /// As a termination condition: the relative error
          /// ||<i>b</i> &minus; <i>Ax</i>|| / ||<i>b</i>|| that denotes convergence.
          double  relativeError;
    
          /// As a termination condition: the absolute error
          /// ||<i>b</i> &minus; <i>Ax</i>|| that denotes convergence.
          double  absoluteError;
    
      };
    
      /// @brief Return default termination conditions for a conjugate gradient solver.
      /// @details The defaults are: @c success = @c false, at most 50 iterations,
      /// a relative error of 1.0e-6 and an absolute error of 100 times the
      /// machine epsilon of @c ValueType.
      template<typename ValueType>
      inline State
      terminationDefaults()
      {
          // The absolute tolerance scales with the precision of the value type.
          const double absTolerance = std::numeric_limits<ValueType>::epsilon() * 100.0;

          State defaults;
          defaults.success = false;
          defaults.iterations = 50;
          defaults.relativeError = 1.0e-6;
          defaults.absoluteError = absTolerance;
          return defaults;
      }
    
      ////////////////////////////////////////
    
      /// @brief Solve @e Ax = @e b via the preconditioned conjugate gradient method.
    
      ///
    
      /// @param A  a symmetric, positive-definite, @e N x @e N matrix
    
      /// @param b  a vector of size @e N
    
      /// @param x  a vector of size @e N
    
      /// @param preconditioner  a Preconditioner matrix
    
      /// @param termination  termination conditions given as a State object with the following fields:
    
      ///     <dl>
    
      ///     <dt><i>success</i>
    
      ///     <dd>ignored
    
      ///     <dt><i>iterations</i>
    
      ///     <dd>the maximum number of iterations, with or without convergence
    
      ///     <dt><i>relativeError</i>
    
      ///     <dd>the relative error ||<i>b</i> &minus; <i>Ax</i>|| / ||<i>b</i>||
    
      ///         that denotes convergence
    
      ///     <dt><i>absoluteError</i>
    
      ///     <dd>the absolute error ||<i>b</i> &minus; <i>Ax</i>|| that denotes convergence
      ///     </dl>
    
      ///
    
      /// @throw ArithmeticError if either @a x or @a b is not of the appropriate size.
    
      template<typename PositiveDefMatrix>
    
      inline State
    
      solve(
    
          const PositiveDefMatrix& A,
    
          const Vector<typename PositiveDefMatrix::ValueType>& b,
    
          Vector<typename PositiveDefMatrix::ValueType>& x,
    
          Preconditioner<typename PositiveDefMatrix::ValueType>& preconditioner,
    
          const State& termination = terminationDefaults<typename PositiveDefMatrix::ValueType>());
    
      /// @brief Solve @e Ax = @e b via the preconditioned conjugate gradient method.
    
      ///
    
      /// @param A  a symmetric, positive-definite, @e N x @e N matrix
    
      /// @param b  a vector of size @e N
    
      /// @param x  a vector of size @e N
    
      /// @param preconditioner  a Preconditioner matrix
    
      /// @param termination  termination conditions given as a State object with the following fields:
    
      ///     <dl>
    
      ///     <dt><i>success</i>
    
      ///     <dd>ignored
    
      ///     <dt><i>iterations</i>
    
      ///     <dd>the maximum number of iterations, with or without convergence
    
      ///     <dt><i>relativeError</i>
    
      ///     <dd>the relative error ||<i>b</i> &minus; <i>Ax</i>|| / ||<i>b</i>||
    
      ///         that denotes convergence
    
      ///     <dt><i>absoluteError</i>
    
      ///     <dd>the absolute error ||<i>b</i> &minus; <i>Ax</i>|| that denotes convergence
      ///     </dl>
    
      /// @param interrupter  an object adhering to the util::NullInterrupter interface
    
      ///     with which computation can be interrupted
    
      ///
    
      /// @throw ArithmeticError if either @a x or @a b is not of the appropriate size.
    
      /// @throw RuntimeError if the computation is interrupted.
    
      template<typename PositiveDefMatrix, typename Interrupter>
    
      inline State
    
      solve(
    
          const PositiveDefMatrix& A,
    
          const Vector<typename PositiveDefMatrix::ValueType>& b,
    
          Vector<typename PositiveDefMatrix::ValueType>& x,
    
          Preconditioner<typename PositiveDefMatrix::ValueType>& preconditioner,
    
          Interrupter& interrupter,
    
          const State& termination = terminationDefaults<typename PositiveDefMatrix::ValueType>());
    
      ////////////////////////////////////////
    
      /// Lightweight, variable-length vector
    
      template<typename T>
    
      class Vector
    
      {
    
      public:
    
          using ValueType = T;
    
          using Ptr = SharedPtr<Vector>;
    
          /// Construct an empty vector.
    
          Vector(): mData(nullptr), mSize(0) {}
    
          /// Construct a vector of @a n elements, with uninitialized values.
    
        12/24✓ Branch 1 taken 1 times.
✓ Branch 2 taken 9 times.
✗ Branch 3 not taken.
✓ Branch 5 taken 11 times.
✗ Branch 6 not taken.
✗ Branch 7 not taken.
✓ Branch 8 taken 9 times.
✗ Branch 9 not taken.
✗ Branch 10 not taken.
✓ Branch 11 taken 1 times.
✗ Branch 12 not taken.
✗ Branch 13 not taken.
✓ Branch 14 taken 1 times.
✓ Branch 15 taken 3 times.
✗ Branch 16 not taken.
✓ Branch 17 taken 1 times.
✗ Branch 18 not taken.
✓ Branch 19 taken 1 times.
✓ Branch 20 taken 3 times.
✗ Branch 21 not taken.
✓ Branch 23 taken 3 times.
✗ Branch 24 not taken.
✓ Branch 27 taken 2 times.
✗ Branch 28 not taken.

      34
          Vector(SizeType n): mData(new T[n]), mSize(n) {}
    
          /// Construct a vector of @a n elements and initialize each element to the given value.
    
      15
          Vector(SizeType n, const ValueType& val): mData(new T[n]), mSize(n) { this->fill(val); }
    
        18/72✓ Branch 0 taken 3 times.
✗ Branch 1 not taken.
✓ Branch 3 taken 9 times.
✓ Branch 4 taken 14 times.
✗ Branch 5 not taken.
✓ Branch 6 taken 9 times.
✗ Branch 7 not taken.
✗ Branch 8 not taken.
✓ Branch 9 taken 9 times.
✗ Branch 10 not taken.
✗ Branch 11 not taken.
✓ Branch 12 taken 9 times.
✗ Branch 13 not taken.
✗ Branch 14 not taken.
✗ Branch 15 not taken.
✗ Branch 16 not taken.
✗ Branch 17 not taken.
✗ Branch 18 not taken.
✗ Branch 19 not taken.
✗ Branch 20 not taken.
✗ Branch 21 not taken.
✗ Branch 22 not taken.
✗ Branch 23 not taken.
✗ Branch 24 not taken.
✗ Branch 25 not taken.
✗ Branch 26 not taken.
✓ Branch 27 taken 1 times.
✗ Branch 28 not taken.
✗ Branch 29 not taken.
✓ Branch 30 taken 1 times.
✗ Branch 31 not taken.
✗ Branch 32 not taken.
✓ Branch 33 taken 1 times.
✗ Branch 34 not taken.
✗ Branch 35 not taken.
✓ Branch 36 taken 1 times.
✗ Branch 37 not taken.
✗ Branch 38 not taken.
✗ Branch 39 not taken.
✗ Branch 40 not taken.
✗ Branch 42 not taken.
✓ Branch 43 taken 2 times.
✗ Branch 44 not taken.
✗ Branch 45 not taken.
✗ Branch 46 not taken.
✗ Branch 47 not taken.
✗ Branch 48 not taken.
✓ Branch 49 taken 2 times.
✗ Branch 50 not taken.
✓ Branch 51 taken 1 times.
✓ Branch 52 taken 2 times.
✗ Branch 53 not taken.
✓ Branch 54 taken 1 times.
✗ Branch 55 not taken.
✓ Branch 57 taken 1 times.
✗ Branch 58 not taken.
✗ Branch 61 not taken.
✗ Branch 62 not taken.
✗ Branch 64 not taken.
✗ Branch 65 not taken.
✗ Branch 67 not taken.
✗ Branch 68 not taken.
✓ Branch 72 taken 1 times.
✗ Branch 73 not taken.
✓ Branch 75 taken 1 times.
✗ Branch 76 not taken.
✗ Branch 80 not taken.
✗ Branch 81 not taken.
✗ Branch 83 not taken.
✗ Branch 84 not taken.
✗ Branch 86 not taken.
✗ Branch 87 not taken.

      43
          ~Vector() { mSize = 0; delete[] mData; mData = nullptr; }
    
          /// Deep copy the given vector.
    
          Vector(const Vector&);
    
          /// Deep copy the given vector.
    
          Vector& operator=(const Vector&);
    
          /// Return the number of elements in this vector.
    
        9/27✓ Branch 1 taken 1 times.
✗ Branch 2 not taken.
✓ Branch 4 taken 1 times.
✗ Branch 5 not taken.
✗ Branch 7 not taken.
✗ Branch 8 not taken.
✗ Branch 10 not taken.
✗ Branch 11 not taken.
✗ Branch 13 not taken.
✗ Branch 14 not taken.
✓ Branch 16 taken 2 times.
✗ Branch 17 not taken.
✓ Branch 19 taken 2 times.
✗ Branch 20 not taken.
✗ Branch 22 not taken.
✗ Branch 23 not taken.
✗ Branch 25 not taken.
✗ Branch 26 not taken.
✓ Branch 28 taken 2 times.
✗ Branch 29 not taken.
✓ Branch 31 taken 2 times.
✗ Branch 32 not taken.
✓ Branch 33 taken 7202 times.
✓ Branch 34 taken 3 times.
✗ Branch 35 not taken.
✓ Branch 36 taken 1 times.
✗ Branch 37 not taken.

      7216
          SizeType size() const { return mSize; }
    
          /// Return @c true if this vector has no elements.
    
          bool empty() const { return (mSize == 0); }
    
          /// @brief Reset this vector to have @a n elements, with uninitialized values.
    
          /// @warning All of this vector's existing values will be lost.
    
          void resize(SizeType n);
    
          /// Swap internal storage with another vector, which need not be the same size.
    
          void swap(Vector& other) { std::swap(mData, other.mData); std::swap(mSize, other.mSize); }
    
          /// Set all elements of this vector to @a value.
    
          void fill(const ValueType& value);
    
          //@{
    
          /// @brief Multiply each element of this vector by @a s.
    
          template<typename Scalar> void scale(const Scalar& s);
    
          template<typename Scalar> Vector& operator*=(const Scalar& s) { this->scale(s); return *this; }
    
          //@}
    
          /// Return the dot product of this vector with the given vector, which must be the same size.
    
          ValueType dot(const Vector&) const;
    
          /// Return the infinity norm of this vector.
    
          ValueType infNorm() const;
    
          /// Return the L2 norm of this vector.
    
      471
          ValueType l2Norm() const { return Sqrt(this->dot(*this)); }
    
          /// Return @c true if every element of this vector has a finite value.
    
          bool isFinite() const;
    
          /// @brief Return @c true if this vector is equivalent to the given vector
    
          /// to within the specified tolerance.
    
          template<typename OtherValueType>
    
          bool eq(const Vector<OtherValueType>& other,
    
              ValueType eps = Tolerance<ValueType>::value()) const;
    
          /// Return a string representation of this vector.
    
          std::string str() const;
    
          //@{
    
          /// @brief Return the value of this vector's ith element.
    
        20/50✓ Branch 1 taken 1 times.
✗ Branch 2 not taken.
✗ Branch 3 not taken.
✓ Branch 4 taken 1 times.
✗ Branch 5 not taken.
✗ Branch 6 not taken.
✗ Branch 7 not taken.
✓ Branch 8 taken 1457 times.
✗ Branch 9 not taken.
✗ Branch 10 not taken.
✓ Branch 11 taken 1457 times.
✗ Branch 12 not taken.
✗ Branch 13 not taken.
✓ Branch 14 taken 1922 times.
✗ Branch 15 not taken.
✗ Branch 16 not taken.
✓ Branch 17 taken 1922 times.
✗ Branch 18 not taken.
✗ Branch 19 not taken.
✓ Branch 20 taken 1457 times.
✗ Branch 21 not taken.
✓ Branch 23 taken 1457 times.
✗ Branch 24 not taken.
✗ Branch 25 not taken.
✓ Branch 27 taken 22418 times.
✗ Branch 28 not taken.
✓ Branch 30 taken 29620 times.
✗ Branch 31 not taken.
✓ Branch 33 taken 22418 times.
✗ Branch 34 not taken.
✓ Branch 36 taken 22418 times.
✗ Branch 37 not taken.
✓ Branch 39 taken 22418 times.
✗ Branch 40 not taken.
✓ Branch 42 taken 22418 times.
✗ Branch 43 not taken.
✗ Branch 47 not taken.
✗ Branch 48 not taken.
✓ Branch 50 taken 12418 times.
✗ Branch 51 not taken.
✓ Branch 53 taken 12418 times.
✗ Branch 54 not taken.
✓ Branch 56 taken 12418 times.
✗ Branch 57 not taken.
✓ Branch 59 taken 12418 times.
✗ Branch 60 not taken.
✓ Branch 62 taken 12418 times.
✗ Branch 63 not taken.
✓ Branch 65 taken 12418 times.
✗ Branch 66 not taken.

      4078523
          inline T& at(SizeType i) { return mData[i]; }
    
        1/2✓ Branch 4 taken 7202 times.
✗ Branch 5 not taken.

      3852433
          inline const T& at(SizeType i) const { return mData[i]; }
    
          inline T& operator[](SizeType i) { return this->at(i); }
    
          inline const T& operator[](SizeType i) const { return this->at(i); }
    
          //@}
    
          //@{
    
          /// @brief Return a pointer to this vector's elements.
    
      2825
          inline T* data() { return mData; }
    
      708006416
          inline const T* data() const { return mData; }
    
          inline const T* constData() const { return mData; }
    
          //@}
    
      private:
    
          // Functor for use with tbb::parallel_for()
    
          template<typename Scalar> struct ScaleOp;
    
          struct DeterministicDotProductOp;
    
          // Functors for use with tbb::parallel_reduce()
    
          template<typename OtherValueType> struct EqOp;
    
          struct InfNormOp;
    
          struct IsFiniteOp;
    
          T* mData;
    
          SizeType mSize;
    
      };
    
      using VectorS = Vector<float>;
    
      using VectorD = Vector<double>;
    
      ////////////////////////////////////////
    
      /// @brief Sparse, square matrix representing a 3D stencil operator of size @a STENCIL_SIZE
    
      /// @details The implementation is a variation on compressed row storage (CRS).
    
      template<typename ValueType_, SizeType STENCIL_SIZE>
    
      class SparseStencilMatrix
    
      {
    
      public:
    
          using ValueType = ValueType_;
    
          using VectorType = Vector<ValueType>;
    
          using Ptr = SharedPtr<SparseStencilMatrix>;
    
          class ConstValueIter;
    
          class ConstRow;
    
          class RowEditor;
    
          static const ValueType sZeroValue;
    
          /// Construct an @a n x @a n matrix with at most @a STENCIL_SIZE nonzero elements per row.
    
          SparseStencilMatrix(SizeType n);
    
          /// Deep copy the given matrix.
    
          SparseStencilMatrix(const SparseStencilMatrix&);
    
          //@{
    
          /// Return the number of rows in this matrix.
    
        1/2✓ Branch 1 taken 8 times.
✗ Branch 2 not taken.

      8
          SizeType numRows() const { return mNumRows; }
    
        1/2✓ Branch 1 taken 2 times.
✗ Branch 2 not taken.

      2
          SizeType size() const { return mNumRows; }
    
          //@}
    
          /// @brief Set the value at the given coordinates.
    
          /// @warning It is not safe to set values in the same row simultaneously
    
          /// from multiple threads.
    
          void setValue(SizeType row, SizeType col, const ValueType&);
    
          //@{
    
          /// @brief Return the value at the given coordinates.
    
          /// @warning It is not safe to get values from a row while another thread
    
          /// is setting values in that row.
    
          const ValueType& getValue(SizeType row, SizeType col) const;
    
          const ValueType& operator()(SizeType row, SizeType col) const;
    
          //@}
    
          /// Return a read-only view onto the given row of this matrix.
    
          ConstRow getConstRow(SizeType row) const;
    
          /// Return a read/write view onto the given row of this matrix.
    
          RowEditor getRowEditor(SizeType row);
    
          //@{
    
          /// @brief Multiply all elements in the matrix by @a s.
    
          template<typename Scalar> void scale(const Scalar& s);
    
          template<typename Scalar>
    
          SparseStencilMatrix& operator*=(const Scalar& s) { this->scale(s); return *this; }
    
          //@}
    
          /// @brief Multiply this matrix by @a inVec and return the result in @a resultVec.
    
          /// @throw ArithmeticError if either @a inVec or @a resultVec is not of size @e N,
    
          /// where @e N x @e N is the size of this matrix.
    
          template<typename VecValueType>
    
          void vectorMultiply(const Vector<VecValueType>& inVec, Vector<VecValueType>& resultVec) const;
    
          /// @brief Multiply this matrix by the vector represented by the array @a inVec
    
          /// and return the result in @a resultVec.
    
          /// @warning Both @a inVec and @a resultVec must have at least @e N elements,
    
          /// where @e N x @e N is the size of this matrix.
    
          template<typename VecValueType>
    
          void vectorMultiply(const VecValueType* inVec, VecValueType* resultVec) const;
    
          /// @brief Return @c true if this matrix is equivalent to the given matrix
    
          /// to within the specified tolerance.
    
          template<typename OtherValueType>
    
          bool eq(const SparseStencilMatrix<OtherValueType, STENCIL_SIZE>& other,
    
              ValueType eps = Tolerance<ValueType>::value()) const;
    
          /// Return @c true if every element of this matrix has a finite value.
    
          bool isFinite() const;
    
          /// Return a string representation of this matrix.
    
          std::string str() const;
    
      private:
    
          struct RowData {
    
      70502483
              RowData(ValueType* v, SizeType* c, SizeType& s): mVals(v), mCols(c), mSize(s) {}
    
              ValueType* mVals; SizeType* mCols; SizeType& mSize;
    
          };
    
          struct ConstRowData {
    
      1157260973
              ConstRowData(const ValueType* v, const SizeType* c, const SizeType& s):
    
      1157260973
                  mVals(v), mCols(c), mSize(s) {}
    
              const ValueType* mVals; const SizeType* mCols; const SizeType& mSize;
    
          };
    
          /// Base class for row accessors
    
          template<typename DataType_ = RowData>
    
          class RowBase
    
          {
    
          public:
    
              using DataType = DataType_;
    
              static SizeType capacity() { return STENCIL_SIZE; }
    
      1227763456
              RowBase(const DataType& data): mData(data) {}
    
      929686646
              bool empty() const { return (mData.mSize == 0); }
    
      1889530866
              const SizeType& size() const { return mData.mSize; }
    
              const ValueType& getValue(SizeType columnIdx, bool& active) const;
    
              const ValueType& getValue(SizeType columnIdx) const;
    
              /// Return an iterator over the stored values in this row.
    
              ConstValueIter cbegin() const;
    
              /// @brief Return @c true if this row is equivalent to the given row
    
              /// to within the specified tolerance.
    
              template<typename OtherDataType>
    
              bool eq(const RowBase<OtherDataType>& other,
    
                  ValueType eps = Tolerance<ValueType>::value()) const;
    
              /// @brief Return the dot product of this row with the first
    
              /// @a vecSize elements of @a inVec.
    
              /// @warning @a inVec must have at least @a vecSize elements.
    
              template<typename VecValueType>
    
              VecValueType dot(const VecValueType* inVec, SizeType vecSize) const;
    
              /// Return the dot product of this row with the given vector.
    
              template<typename VecValueType>
    
              VecValueType dot(const Vector<VecValueType>& inVec) const;
    
              /// Return a string representation of this row.
    
              std::string str() const;
    
          protected:
    
              friend class ConstValueIter;
    
      6075874694
              const ValueType& value(SizeType i) const { return mData.mVals[i]; }
    
      6107290272
              SizeType column(SizeType i) const { return mData.mCols[i]; }
    
              /// @brief Return the array index of the first column index that is
    
              /// equal to <i>or greater than</i> the given column index.
    
              /// @note If @a columnIdx is larger than any existing column index,
    
              /// the return value will point beyond the end of the array.
    
              SizeType find(SizeType columnIdx) const;
    
              DataType mData;
    
          };
    
          using ConstRowBase = RowBase<ConstRowData>;
    
      public:
    
          /// Iterator over the stored values in a row of this matrix
    
          class ConstValueIter
    
          {
    
          public:
    
              const ValueType& operator*() const
    
              {
    
        5/10✓ Branch 0 taken 18 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 18 times.
✗ Branch 3 not taken.
✓ Branch 4 taken 26 times.
✗ Branch 5 not taken.
✓ Branch 6 taken 14169979 times.
✗ Branch 7 not taken.
✓ Branch 8 taken 10592476 times.
✗ Branch 9 not taken.

      24762517
                  if (mData.mSize == 0) return SparseStencilMatrix::sZeroValue;
    
      24762517
                  return mData.mVals[mCursor];
    
              }
    
      172613470
              SizeType column() const { return mData.mCols[mCursor]; }
    
      172613496
              void increment() { mCursor++; }
    
      172613496
              ConstValueIter& operator++() { increment(); return *this; }
    
      197516014
              operator bool() const { return (mCursor < mData.mSize); }
    
      3577503
              void reset() { mCursor = 0; }
    
          private:
    
              friend class SparseStencilMatrix;
    
              ConstValueIter(const RowData& d): mData(d.mVals, d.mCols, d.mSize), mCursor(0) {}
    
      21325005
              ConstValueIter(const ConstRowData& d): mData(d), mCursor(0) {}
    
              const ConstRowData mData;
    
              SizeType mCursor;
    
          };
    
          /// Read-only accessor to a row of this matrix
    
          class ConstRow: public ConstRowBase
    
          {
    
          public:
    
              ConstRow(const ValueType* valueHead, const SizeType* columnHead, const SizeType& rowSize);
    
          }; // class ConstRow
    
          /// Read/write accessor to a row of this matrix
    
          class RowEditor: public RowBase<>
    
          {
    
          public:
    
              RowEditor(ValueType* valueHead, SizeType* columnHead, SizeType& rowSize, SizeType colSize);
    
              /// Set the number of entries in this row to zero.
    
              void clear();
    
              /// @brief Set the value of the entry in the specified column.
    
              /// @return the current number of entries stored in this row.
    
              SizeType setValue(SizeType column, const ValueType& value);
    
              //@{
    
              /// @brief Scale all of the entries in this row.
    
              template<typename Scalar> void scale(const Scalar&);
    
              template<typename Scalar>
    
              RowEditor& operator*=(const Scalar& s) { this->scale(s); return *this; }
    
              //@}
    
          private:
    
              const SizeType mNumColumns; // used only for bounds checking
    
          }; // class RowEditor
    
      private:
    
          // Functors for use with tbb::parallel_for()
    
          struct MatrixCopyOp;
    
          template<typename VecValueType> struct VecMultOp;
    
          template<typename Scalar> struct RowScaleOp;
    
          // Functors for use with tbb::parallel_reduce()
    
          struct IsFiniteOp;
    
          template<typename OtherValueType> struct EqOp;
    
          const SizeType                  mNumRows;
    
          std::unique_ptr<ValueType[]>    mValueArray;
    
          std::unique_ptr<SizeType[]>     mColumnIdxArray;
    
          std::unique_ptr<SizeType[]>     mRowSizeArray;
    
      }; // class SparseStencilMatrix
    
      ////////////////////////////////////////
    
      /// Base class for conjugate gradient preconditioners
      ///
      /// @details Derived classes must implement apply(); isValid() may be
      /// overridden (the default implementation returns @c true).
    
      template<typename T>
    
      class Preconditioner
    
      {
    
      public:
    
          using ValueType = T;
    
          using Ptr = SharedPtr<Preconditioner>;
    
          /// Construct from a sparse stencil matrix. The base class does not
          /// use the matrix argument (the parameter is unnamed and the body is empty).
      9
          template<SizeType STENCIL_SIZE> Preconditioner(const SparseStencilMatrix<T, STENCIL_SIZE>&) {}
    
          virtual ~Preconditioner() = default;
    
          /// Return @c true; derived classes may override this.
      ✗
          virtual bool isValid() const { return true; }
    
          /// @brief Apply this preconditioner to a residue vector:
    
          ///     @e z = <i>M</i><sup><small>&minus;1</small></sup><i>r</i>
    
          /// @param      r  residue vector
    
          /// @param[out] z  preconditioned residue vector
    
          virtual void apply(const Vector<T>& r, Vector<T>& z) = 0;
    
      };
    
      ////////////////////////////////////////
    
      namespace internal {
    
      // Functor for use with tbb::parallel_for() to copy data from one array to another
    
      template<typename T>
    
      struct CopyOp
    
      {
    
      11
          CopyOp(const T* from_, T* to_): from(from_), to(to_) {}
    
          void operator()(const SizeRange& range) const {
    
        6/8✓ Branch 0 taken 10 times.
✓ Branch 1 taken 10 times.
✗ Branch 2 not taken.
✗ Branch 3 not taken.
✓ Branch 4 taken 208424 times.
✓ Branch 5 taken 90 times.
✓ Branch 6 taken 3369084 times.
✓ Branch 7 taken 922 times.

      3578540
              for (SizeType n = range.begin(), N = range.end(); n < N; ++n) to[n] = from[n];
    
          }
    
          const T* from;
    
          T* to;
    
      };
    
      // Functor for use with tbb::parallel_for() to fill an array with a constant value
    
      template<typename T>
    
      struct FillOp
    
      {
    
      980
          FillOp(T* data_, const T& val_): data(data_), val(val_) {}
    
          void operator()(const SizeRange& range) const {
    
        8/8✓ Branch 0 taken 628072 times.
✓ Branch 1 taken 263 times.
✓ Branch 2 taken 10111654 times.
✓ Branch 3 taken 2899 times.
✓ Branch 4 taken 43822536 times.
✓ Branch 5 taken 9418 times.
✓ Branch 6 taken 687828130 times.
✓ Branch 7 taken 119409 times.

      742522381
              for (SizeType n = range.begin(), N = range.end(); n < N; ++n) data[n] = val;
    
          }
    
          T* data;
    
          const T val;
    
      };
    
      // Functor for use with tbb::parallel_for() that computes a * x + y
    
      template<typename T>
    
      struct LinearOp
    
      {
    
      1404
          LinearOp(const T& a_, const T* x_, const T* y_, T* out_): a(a_), x(x_), y(y_), out(out_) {}
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 261059 times.

      261059
          void operator()(const SizeRange& range) const {
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 261059 times.

      261059
              if (isExactlyEqual(a, T(1))) {
    
      ✗
                  for (SizeType n = range.begin(), N = range.end(); n < N; ++n) out[n] = x[n] + y[n];
    
        2/2✓ Branch 0 taken 1318 times.
✓ Branch 1 taken 259741 times.

      261059
              } else if (isExactlyEqual(a, T(-1))) {
    
        2/2✓ Branch 0 taken 3577508 times.
✓ Branch 1 taken 1318 times.

      3578826
                  for (SizeType n = range.begin(), N = range.end(); n < N; ++n) out[n] = -x[n] + y[n];
    
              } else {
    
        2/2✓ Branch 0 taken 1058425753 times.
✓ Branch 1 taken 259741 times.

      1058685494
                  for (SizeType n = range.begin(), N = range.end(); n < N; ++n) out[n] = a * x[n] + y[n];
    
              }
    
      261059
          }
    
          const T a, *x, *y;
    
          T* out;
    
      };
    
      } // namespace internal
    
      ////////////////////////////////////////
    
      /// Write a one-line summary of @a state (outcome, relative and absolute
      /// error, iteration count) to @a os and return the stream.
      inline std::ostream&
      operator<<(std::ostream& os, const State& state)
      {
          const char* const outcome = state.success ? "succeeded with " : "";
          // "iteration" is pluralized unless exactly one iteration was performed.
          const char* const plural = (state.iterations == 1) ? "" : "s";

          os << outcome;
          os << "rel. err. " << state.relativeError;
          os << ", abs. err. " << state.absoluteError;
          os << " after " << state.iterations << " iteration" << plural;
          return os;
      }
    
      ////////////////////////////////////////
    
      /// Deep copy: allocate storage for as many elements as @a other holds,
      /// then copy the elements of @a other into it with tbb::parallel_for().
      template<typename T>
      inline
      Vector<T>::Vector(const Vector& other):
          mData(new T[other.mSize]),
          mSize(other.mSize)
      {
          const internal::CopyOp<T> copyOp(/*from=*/other.mData, /*to=*/mData);
          tbb::parallel_for(SizeRange(0, mSize), copyOp);
      }
    
      template<typename T>
    
      inline
    
      9
      Vector<T>& Vector<T>::operator=(const Vector<T>& other)
    
      {
    
          // Update the internal storage to the correct size
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.

      9
          if (mSize != other.mSize) {
    
      ✗
              mSize = other.mSize;
    
      ✗
              delete[] mData;
    
      ✗
              mData = new T[mSize];
    
          }
    
          // Deep copy the data
    
      18
          tbb::parallel_for(SizeRange(0, mSize),
    
      9
              internal::CopyOp<T>(/*from=*/other.mData, /*to=*/mData));
    
      9
          return *this;
    
      }
    
      /// @brief Reset this vector to have @a n elements, with uninitialized values.
      /// @details Nothing happens if the vector already has @a n elements. Otherwise
      /// the new buffer is allocated @e before the old one is released, so that
      /// if the allocation throws, this vector still owns its original storage
      /// and its size is unchanged.
      /// @warning All of this vector's existing values are lost when the size changes.
      template<typename T>
      inline void
      Vector<T>::resize(SizeType n)
      {
          if (n == mSize) return;

          // Allocate first: if this throws, mData and mSize are still consistent.
          T* newData = new T[n];
          delete[] mData; // deleting a null pointer is a no-op, so no check is needed
          mData = newData;
          mSize = n;
      }
    
      /// Assign @a value to every element of this vector using tbb::parallel_for().
      template<typename T>
      inline void
      Vector<T>::fill(const ValueType& value)
      {
          const internal::FillOp<T> fillOp(mData, value);
          tbb::parallel_for(SizeRange(0, mSize), fillOp);
      }
    
      /// Functor for use with tbb::parallel_for() that multiplies the elements
      /// of an array in place by a scalar
      template<typename T>
      template<typename Scalar>
      struct Vector<T>::ScaleOp
      {
          ScaleOp(T* data_, const Scalar& s_): data(data_), s(s_) {}

          /// Scale the elements whose indices lie in @a range.
          void operator()(const SizeRange& range) const
          {
              const SizeType last = range.end();
              SizeType idx = range.begin();
              while (idx < last) {
                  data[idx] *= s;
                  ++idx;
              }
          }

          T* data;
          const Scalar s; // held by value
      };
    
      /// @brief Multiply every element of this vector by @a s, in place,
      /// using a parallel loop.
      template<typename T>
      template<typename Scalar>
      inline void
      Vector<T>::scale(const Scalar& s)
      {
          const ScaleOp<Scalar> scaleOp(mData, s);
          tbb::parallel_for(SizeRange(0, mSize), scaleOp);
      }
    
      /// @brief Functor for tbb::parallel_for that computes partial dot products.
      /// @details The two input arrays are divided into @c binCount contiguous
      /// segments of <tt>arraySize / binCount</tt> elements each (the last segment
      /// also takes any remainder).  For each bin index in the range it is given,
      /// the functor sums <tt>a[i] * b[i]</tt> over that segment in index order
      /// and stores the sum in <tt>reducetmp[bin]</tt>.
      template<typename T>
      struct Vector<T>::DeterministicDotProductOp
      {
          DeterministicDotProductOp(const T* a_, const T* b_,
                  const SizeType binCount_, const SizeType arraySize_, T* reducetmp_):
              a(a_), b(b_), binCount(binCount_), arraySize(arraySize_), reducetmp(reducetmp_) {}

          void operator()(const SizeRange& range) const
          {
              const SizeType binSize = arraySize / binCount;
              const SizeType lastBin = binCount - 1;

              // Iterate over bins (array segments).
              for (SizeType bin = range.begin(), stop = range.end(); bin < stop; ++bin) {
                  const SizeType first = bin * binSize;
                  // The final bin extends to the end of the array.
                  SizeType last = first + binSize;
                  if (bin == lastBin) last = arraySize;

                  // Compute the partial sum for this array segment.
                  T partial = zeroVal<T>();
                  for (SizeType i = first; i < last; ++i) {
                      partial += a[i] * b[i];
                  }

                  // Store the partial sum.
                  reducetmp[bin] = partial;
              }
          }

          const T* a;
          const T* b;
          const SizeType binCount;
          const SizeType arraySize;
          T* reducetmp;
      };
    
      template<typename T>
    
      inline T
    
      1415
      Vector<T>::dot(const Vector<T>& other) const
    
      {
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 1415 times.

      1415
          assert(this->size() == other.size());
    
          const T* aData = this->data();
    
          const T* bData = other.data();
    
          SizeType arraySize = this->size();
    
          T result = zeroVal<T>();
    
        2/2✓ Branch 0 taken 157 times.
✓ Branch 1 taken 1258 times.

      1415
          if (arraySize < 1024) {
    
              // Compute the dot product in serial for small arrays
    
        2/2✓ Branch 0 taken 139090 times.
✓ Branch 1 taken 157 times.

      139247
              for (SizeType n = 0; n < arraySize; ++n) {
    
      139090
                  result += aData[n] * bData[n];
    
              }
    
          } else {
    
              // Compute the dot product by segmenting the arrays into
    
              // a predetermined number of sub arrays in parallel and
    
              // accumulate the finial result in series.
    
              const SizeType binCount = 100;
    
              T partialSums[100];
    
      1258
              tbb::parallel_for(SizeRange(0, binCount),
    
                  DeterministicDotProductOp(aData, bData, binCount, arraySize, partialSums));
    
        2/2✓ Branch 0 taken 125800 times.
✓ Branch 1 taken 1258 times.

      127058
              for (SizeType n = 0; n < binCount; ++n) {
    
      125800
                  result += partialSums[n];
    
              }
    
          }
    
      1415
          return result;
    
      }
    
      /// @brief Reduction body for tbb::parallel_reduce that tracks the largest
      /// absolute value seen in a sub-range of an array.
      template<typename T>
      struct Vector<T>::InfNormOp
      {
          InfNormOp(const T* data_): data(data_) {}

          /// @param range     indices of the elements to examine
          /// @param maxValue  largest absolute value found so far
          /// @return the larger of @a maxValue and the largest absolute value in @a range
          T operator()(const SizeRange& range, T maxValue) const
          {
              const SizeType stop = range.end();
              for (SizeType n = range.begin(); n < stop; ++n) {
                  const auto magnitude = Abs(data[n]);
                  maxValue = Max(maxValue, magnitude);
              }
              return maxValue;
          }

          const T* data;
      };
    
      template<typename T>
    
      inline T
    
      489
      Vector<T>::infNorm() const
    
      {
    
          // Parallelize over the elements of this vector.
    
      489
          T result = tbb::parallel_reduce(SizeRange(0, this->size()), /*seed=*/zeroVal<T>(),
    
      2845
              InfNormOp(this->data()), /*join=*/[](T max1, T max2) { return Max(max1, max2); });
    
      489
          return result;
    
      }
    
      /// @brief Reduction body for tbb::parallel_reduce that reports whether all
      /// array elements in a sub-range pass std::isfinite().
      template<typename T>
      struct Vector<T>::IsFiniteOp
      {
          IsFiniteOp(const T* data_): data(data_) {}

          /// @param range   indices of the elements to examine
          /// @param finite  result accumulated so far; if already @c false,
          ///                the range is not examined
          /// @return @c false if @a finite is @c false or any element in @a range
          ///         is not finite, @c true otherwise
          bool operator()(const SizeRange& range, bool finite) const
          {
              if (!finite) return false;

              const SizeType stop = range.end();
              for (SizeType n = range.begin(); n < stop; ++n) {
                  if (!std::isfinite(data[n])) return false;
              }
              return true;
          }

          const T* data;
      };
    
      template<typename T>
    
      inline bool
    
      9
      Vector<T>::isFinite() const
    
      {
    
          // Parallelize over the elements of this vector.
    
      9
          bool finite = tbb::parallel_reduce(SizeRange(0, this->size()), /*seed=*/true,
    
              IsFiniteOp(this->data()),
    
      9
              /*join=*/[](bool finite1, bool finite2) { return (finite1 && finite2); });
    
      9
          return finite;
    
      }
    
      /// @brief Reduction body for tbb::parallel_reduce that compares two arrays
      /// element by element with isApproxEqual() and a fixed tolerance.
      template<typename T>
      template<typename OtherValueType>
      struct Vector<T>::EqOp
      {
          EqOp(const T* a_, const OtherValueType* b_, T e): a(a_), b(b_), eps(e) {}

          /// @param range  indices of the elements to compare
          /// @param equal  result accumulated so far; if already @c false,
          ///               the range is not examined
          /// @return @c false if @a equal is @c false or any pair of elements in
          ///         @a range is not approximately equal, @c true otherwise
          bool operator()(const SizeRange& range, bool equal) const
          {
              if (!equal) return false;

              const SizeType stop = range.end();
              for (SizeType n = range.begin(); n < stop; ++n) {
                  if (!isApproxEqual(a[n], b[n], eps)) return false;
              }
              return true;
          }

          const T* a;
          const OtherValueType* b;
          const T eps;
      };
    
      template<typename T>
    
      template<typename OtherValueType>
    
      inline bool
    
      2
      Vector<T>::eq(const Vector<OtherValueType>& other, ValueType eps) const
    
      {
    
        1/2✓ Branch 0 taken 2 times.
✗ Branch 1 not taken.

      2
          if (this->size() != other.size()) return false;
    
      2
          bool equal = tbb::parallel_reduce(SizeRange(0, this->size()), /*seed=*/true,
    
              EqOp<OtherValueType>(this->data(), other.data(), eps),
    
      ✗
              /*join=*/[](bool eq1, bool eq2) { return (eq1 && eq2); });
    
      2
          return equal;
    
      }
    
      /// @brief Return a string of the form <tt>[e0, e1, ...]</tt> listing this
      /// vector's elements in index order.
      template<typename T>
      inline std::string
      Vector<T>::str() const
      {
          std::ostringstream ostr;
          ostr << "[";
          const SizeType count = this->size();
          for (SizeType n = 0; n < count; ++n) {
              // Separate consecutive elements; nothing precedes the first one.
              if (n > 0) ostr << ", ";
              ostr << (*this)[n];
          }
          ostr << "]";
          return ostr.str();
      }
    
      ////////////////////////////////////////
    
      /// Definition of the static zero constant.  The row getValue() methods
      /// return a reference to it when the requested column is not stored in the row.
      template<typename ValueType, SizeType STENCIL_SIZE>
      const ValueType SparseStencilMatrix<ValueType, STENCIL_SIZE>::sZeroValue = zeroVal<ValueType>();
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      inline
    
      58
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::SparseStencilMatrix(SizeType numRows)
    
          : mNumRows(numRows)
    
      58
          , mValueArray(new ValueType[mNumRows * STENCIL_SIZE])
    
        1/2✓ Branch 1 taken 29 times.
✗ Branch 2 not taken.

      58
          , mColumnIdxArray(new SizeType[mNumRows * STENCIL_SIZE])
    
        1/2✓ Branch 2 taken 29 times.
✗ Branch 3 not taken.

      116
          , mRowSizeArray(new SizeType[mNumRows])
    
      {
    
          // Initialize the matrix to a null state by setting the size of each row to zero.
    
        1/4✓ Branch 1 taken 29 times.
✗ Branch 2 not taken.
✗ Branch 3 not taken.
✗ Branch 4 not taken.

      58
          tbb::parallel_for(SizeRange(0, mNumRows),
    
              internal::FillOp<SizeType>(mRowSizeArray.get(), /*value=*/0));
    
      58
      }
    
      /// @brief Functor for tbb::parallel_for that copies a sub-range of the value
      /// and column-index arrays from one matrix to another.
      /// @details Range indices address the flat storage arrays directly, not rows.
      template<typename ValueType, SizeType STENCIL_SIZE>
      struct SparseStencilMatrix<ValueType, STENCIL_SIZE>::MatrixCopyOp
      {
          MatrixCopyOp(const SparseStencilMatrix& from_, SparseStencilMatrix& to_):
              from(&from_), to(&to_) {}

          void operator()(const SizeRange& range) const
          {
              const ValueType* srcValues = from->mValueArray.get();
              const SizeType* srcColumns = from->mColumnIdxArray.get();
              ValueType* dstValues = to->mValueArray.get();
              SizeType* dstColumns = to->mColumnIdxArray.get();

              const SizeType stop = range.end();
              for (SizeType slot = range.begin(); slot < stop; ++slot) {
                  dstValues[slot] = srcValues[slot];
                  dstColumns[slot] = srcColumns[slot];
              }
          }

          const SparseStencilMatrix* from;
          SparseStencilMatrix* to;
      };
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      inline
    
      2
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::SparseStencilMatrix(const SparseStencilMatrix& other)
    
      2
          : mNumRows(other.mNumRows)
    
      2
          , mValueArray(new ValueType[mNumRows * STENCIL_SIZE])
    
        1/2✓ Branch 1 taken 2 times.
✗ Branch 2 not taken.

      2
          , mColumnIdxArray(new SizeType[mNumRows * STENCIL_SIZE])
    
        1/2✓ Branch 2 taken 2 times.
✗ Branch 3 not taken.

      4
          , mRowSizeArray(new SizeType[mNumRows])
    
      {
    
        1/2✓ Branch 1 taken 2 times.
✗ Branch 2 not taken.

      2
          SizeType size = mNumRows * STENCIL_SIZE;
    
          // Copy the value and column index arrays from the other matrix to this matrix.
    
        2/4✓ Branch 1 taken 2 times.
✗ Branch 2 not taken.
✓ Branch 4 taken 2 times.
✗ Branch 5 not taken.

      2
          tbb::parallel_for(SizeRange(0, size), MatrixCopyOp(/*from=*/other, /*to=*/*this));
    
          // Copy the row size array from the other matrix to this matrix.
    
        1/4✓ Branch 1 taken 2 times.
✗ Branch 2 not taken.
✗ Branch 3 not taken.
✗ Branch 4 not taken.

      2
          tbb::parallel_for(SizeRange(0, mNumRows),
    
              internal::CopyOp<SizeType>(/*from=*/other.mRowSizeArray.get(), /*to=*/mRowSizeArray.get()));
    
      2
      }
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      inline void
    
      88
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::setValue(SizeType row, SizeType col,
    
          const ValueType& val)
    
      {
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 44 times.

      88
          assert(row < mNumRows);
    
      88
          this->getRowEditor(row).setValue(col, val);
    
      88
      }
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      inline const ValueType&
    
      28339968
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::getValue(SizeType row, SizeType col) const
    
      {
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 14169984 times.

      28339968
          assert(row < mNumRows);
    
      28339968
          return this->getConstRow(row).getValue(col);
    
      }
    
      /// @brief Function-call syntax for getValue(): return the entry at (@a row, @a col).
      template<typename ValueType, SizeType STENCIL_SIZE>
      inline const ValueType&
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::operator()(SizeType row, SizeType col) const
      {
          const ValueType& entry = this->getValue(row, col);
          return entry;
      }
    
      /// @brief Functor for tbb::parallel_for that scales every row in a
      /// sub-range of a matrix's rows by a fixed scalar.
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename Scalar>
      struct SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowScaleOp
      {
          RowScaleOp(SparseStencilMatrix& m, const Scalar& s_): mat(&m), s(s_) {}

          /// Scale the rows whose indices lie in @a range.
          void operator()(const SizeRange& range) const
          {
              const SizeType stop = range.end();
              for (SizeType rowIdx = range.begin(); rowIdx < stop; ++rowIdx) {
                  RowEditor editor = mat->getRowEditor(rowIdx);
                  editor.scale(s);
              }
          }

          SparseStencilMatrix* mat;
          const Scalar s;
      };
    
      /// @brief Multiply all stored entries of this matrix by @a s, in place.
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename Scalar>
      inline void
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::scale(const Scalar& s)
      {
          // Parallelize over the rows in the matrix.
          const RowScaleOp<Scalar> scaleRows(*this, s);
          tbb::parallel_for(SizeRange(0, mNumRows), scaleRows);
      }
    
      /// @brief Functor for tbb::parallel_for that computes a sub-range of the
      /// elements of a matrix-vector product.
      /// @details For each row index @c n in the range, <tt>out[n]</tt> is set to
      /// the dot product of matrix row @c n with the input array.
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename VecValueType>
      struct SparseStencilMatrix<ValueType, STENCIL_SIZE>::VecMultOp
      {
          VecMultOp(const SparseStencilMatrix& m, const VecValueType* i, VecValueType* o):
              mat(&m), in(i), out(o) {}

          void operator()(const SizeRange& range) const
          {
              const SizeType stop = range.end();
              for (SizeType rowIdx = range.begin(); rowIdx < stop; ++rowIdx) {
                  const ConstRow rowView = mat->getConstRow(rowIdx);
                  out[rowIdx] = rowView.dot(in, mat->numRows());
              }
          }

          const SparseStencilMatrix* mat;
          const VecValueType* in;
          VecValueType* out;
      };
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      template<typename VecValueType>
    
      inline void
    
      475
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::vectorMultiply(
    
          const Vector<VecValueType>& inVec, Vector<VecValueType>& resultVec) const
    
      {
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 473 times.

      475
          if (inVec.size() != mNumRows) {
    
      ✗
              OPENVDB_THROW(ArithmeticError, "matrix and input vector have incompatible sizes ("
    
                  << mNumRows << "x" << mNumRows << " vs. " << inVec.size() << ")");
    
          }
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 473 times.

      475
          if (resultVec.size() != mNumRows) {
    
      ✗
              OPENVDB_THROW(ArithmeticError, "matrix and result vector have incompatible sizes ("
    
                  << mNumRows << "x" << mNumRows << " vs. " << resultVec.size() << ")");
    
          }
    
          vectorMultiply(inVec.data(), resultVec.data());
    
      475
      }
    
      /// @brief Multiply this matrix by the array @a inVec and store the product
      /// in the array @a resultVec.
      /// @note No size checks are performed here; one result element is written
      /// per matrix row.
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename VecValueType>
      inline void
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::vectorMultiply(
          const VecValueType* inVec, VecValueType* resultVec) const
      {
          // Parallelize over the rows in the matrix.
          const VecMultOp<VecValueType> multiplyRows(*this, inVec, resultVec);
          tbb::parallel_for(SizeRange(0, mNumRows), multiplyRows);
      }
    
      /// @brief Reduction body for tbb::parallel_reduce that compares the
      /// corresponding rows of two matrices over a sub-range of row indices.
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename OtherValueType>
      struct SparseStencilMatrix<ValueType, STENCIL_SIZE>::EqOp
      {
          EqOp(const SparseStencilMatrix& a_,
              const SparseStencilMatrix<OtherValueType, STENCIL_SIZE>& b_, ValueType e):
              a(&a_), b(&b_), eps(e) {}

          /// @param range  indices of the rows to compare
          /// @param equal  result accumulated so far; if already @c false,
          ///               the range is not examined
          /// @return @c false if @a equal is @c false or any pair of rows in
          ///         @a range compares unequal, @c true otherwise
          bool operator()(const SizeRange& range, bool equal) const
          {
              if (!equal) return false;

              const SizeType stop = range.end();
              for (SizeType rowIdx = range.begin(); rowIdx < stop; ++rowIdx) {
                  if (!a->getConstRow(rowIdx).eq(b->getConstRow(rowIdx), eps)) return false;
              }
              return true;
          }

          const SparseStencilMatrix* a;
          const SparseStencilMatrix<OtherValueType, STENCIL_SIZE>* b;
          const ValueType eps;
      };
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      template<typename OtherValueType>
    
      inline bool
    
      2
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::eq(
    
          const SparseStencilMatrix<OtherValueType, STENCIL_SIZE>& other, ValueType eps) const
    
      {
    
        1/2✓ Branch 0 taken 2 times.
✗ Branch 1 not taken.

      2
          if (this->numRows() != other.numRows()) return false;
    
      2
          bool equal = tbb::parallel_reduce(SizeRange(0, this->numRows()), /*seed=*/true,
    
              EqOp<OtherValueType>(*this, other, eps),
    
      1
              /*join=*/[](bool eq1, bool eq2) { return (eq1 && eq2); });
    
      2
          return equal;
    
      }
    
      /// @brief Reduction body for tbb::parallel_reduce that reports whether all
      /// stored values in a sub-range of a matrix's rows pass std::isfinite().
      template<typename ValueType, SizeType STENCIL_SIZE>
      struct SparseStencilMatrix<ValueType, STENCIL_SIZE>::IsFiniteOp
      {
          IsFiniteOp(const SparseStencilMatrix& m): mat(&m) {}

          /// @param range   indices of the rows to examine
          /// @param finite  result accumulated so far; if already @c false,
          ///                the range is not examined
          /// @return @c false if @a finite is @c false or any value in the rows of
          ///         @a range is not finite, @c true otherwise
          bool operator()(const SizeRange& range, bool finite) const
          {
              if (!finite) return false;

              const SizeType stop = range.end();
              for (SizeType rowIdx = range.begin(); rowIdx < stop; ++rowIdx) {
                  const ConstRow rowView = mat->getConstRow(rowIdx);
                  // Visit each value stored in this row.
                  for (ConstValueIter it = rowView.cbegin(); it; ++it) {
                      if (!std::isfinite(*it)) return false;
                  }
              }
              return true;
          }

          const SparseStencilMatrix* mat;
      };
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      inline bool
    
      2
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::isFinite() const
    
      {
    
          // Parallelize over the rows of this matrix.
    
      2
          bool finite = tbb::parallel_reduce(SizeRange(0, this->numRows()), /*seed=*/true,
    
      ✗
              IsFiniteOp(*this), /*join=*/[](bool finite1, bool finite2) { return (finite1&&finite2); });
    
      2
          return finite;
    
      }
    
      /// @brief Return a string with one line per row, each of the form
      /// <tt>rowIndex: rowContents</tt>, where the contents come from the row's
      /// own str() method.
      template<typename ValueType, SizeType STENCIL_SIZE>
      inline std::string
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::str() const
      {
          std::ostringstream ostr;
          const SizeType rowCount = this->size();
          for (SizeType rowIdx = 0; rowIdx < rowCount; ++rowIdx) {
              const ConstRow rowView = this->getConstRow(rowIdx);
              ostr << rowIdx << ": " << rowView.str() << "\n";
          }
          return ostr.str();
      }
    
      /// @brief Return a read/write accessor to row @a i.
      /// @details The accessor is handed pointers to the first value and column
      /// slots of the row, a reference to the row's size counter, and the number
      /// of rows of this matrix as the column count.
      /// @note @a i must be less than the number of rows (checked with an assertion).
      template<typename ValueType, SizeType STENCIL_SIZE>
      inline typename SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowEditor
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::getRowEditor(SizeType i)
      {
          assert(i < mNumRows);

          // Each row occupies STENCIL_SIZE consecutive slots of the storage arrays.
          const SizeType head = i * STENCIL_SIZE;
          ValueType* rowValues = &mValueArray[head];
          SizeType* rowColumns = &mColumnIdxArray[head];
          return RowEditor(rowValues, rowColumns, mRowSizeArray[i], mNumRows);
      }
    
      /// @brief Return a read-only accessor to row @a i.
      /// @details The accessor is handed pointers to the first value and column
      /// slots of the row and a reference to the row's size counter.
      /// @note @a i must be less than the number of rows (checked with an assertion).
      template<typename ValueType, SizeType STENCIL_SIZE>
      inline typename SparseStencilMatrix<ValueType, STENCIL_SIZE>::ConstRow
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::getConstRow(SizeType i) const
      {
          assert(i < mNumRows);

          // Index for this row into main storage.
          const SizeType head = i * STENCIL_SIZE;
          const ValueType* rowValues = &mValueArray[head];
          const SizeType* rowColumns = &mColumnIdxArray[head];
          return ConstRow(rowValues, rowColumns, mRowSizeArray[i]);
      }
    
      /// @brief Return the offset within this row of the first stored column
      /// index that is equal to or greater than @a columnIdx.
      /// @details Returns the row size if the row is empty or if every stored
      /// column index is less than @a columnIdx.  The search is a binary search,
      /// which assumes that the row's column indices are sorted in ascending order.
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename DataType>
      inline SizeType
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowBase<DataType>::find(SizeType columnIdx) const
      {
          if (this->empty()) return mData.mSize;

          // Locate the first column index that is equal to or greater than the given index.
          // (This assumes that the data is sorted by column.)
          const SizeType* const first = mData.mCols;
          const SizeType* const last = first + mData.mSize;
          const SizeType* const hit = std::lower_bound(first, last, columnIdx);

          // Convert the pointer into an offset from the beginning of the array.
          return static_cast<SizeType>(hit - first);
      }
    
      /// @brief Return a reference to the value stored for column @a columnIdx.
      /// @param columnIdx    the column to look up
      /// @param[out] active  set to @c true if the column is stored in this row,
      ///                     @c false otherwise
      /// @return the stored value, or the matrix's static zero value if the
      ///         column is not stored in this row
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename DataType>
      inline const ValueType&
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowBase<DataType>::getValue(
          SizeType columnIdx, bool& active) const
      {
          active = false;
          const SizeType idx = this->find(columnIdx);

          // find() returns a lower bound, so confirm that it is an exact match.
          const bool found = (idx < this->size()) && (this->column(idx) == columnIdx);
          if (!found) return SparseStencilMatrix::sZeroValue;

          active = true;
          return this->value(idx);
      }
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      template<typename DataType>
    
      inline const ValueType&
    
      1640716430
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowBase<DataType>::getValue(SizeType columnIdx) const
    
      {
    
      1640716430
          SizeType idx = this->find(columnIdx);
    
        3/4✓ Branch 0 taken 820358215 times.
✗ Branch 1 not taken.
✓ Branch 2 taken 788942637 times.
✓ Branch 3 taken 31415578 times.

      1640716430
          if (idx < this->size() && this->column(idx) == columnIdx) {
    
      1577885274
              return this->value(idx);
    
          }
    
          return SparseStencilMatrix::sZeroValue;
    
      }
    
      /// @brief Return a read-only value iterator constructed from this row's data.
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename DataType>
      inline typename SparseStencilMatrix<ValueType, STENCIL_SIZE>::ConstValueIter
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowBase<DataType>::cbegin() const
      {
          ConstValueIter iter(mData);
          return iter;
      }
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      template<typename DataType>
    
      template<typename OtherDataType>
    
      inline bool
    
      10
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowBase<DataType>::eq(
    
          const RowBase<OtherDataType>& other, ValueType eps) const
    
      {
    
        1/2✓ Branch 0 taken 10 times.
✗ Branch 1 not taken.

      10
          if (this->size() != other.size()) return false;
    
        3/4✓ Branch 0 taken 10 times.
✓ Branch 1 taken 18 times.
✗ Branch 2 not taken.
✓ Branch 3 taken 10 times.

      28
          for (ConstValueIter it = cbegin(), oit = other.cbegin(); it || oit; ++it, ++oit) {
    
        1/2✓ Branch 0 taken 18 times.
✗ Branch 1 not taken.

      18
              if (it.column() != oit.column()) return false;
    
        1/2✓ Branch 0 taken 18 times.
✗ Branch 1 not taken.

      18
              if (!isApproxEqual(*it, *oit, eps)) return false;
    
          }
    
      10
          return true;
    
      }
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      template<typename DataType>
    
      template<typename VecValueType>
    
      inline VecValueType
    
        2/2✓ Branch 0 taken 1065587933 times.
✓ Branch 1 taken 8 times.

      2131175882
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowBase<DataType>::dot(
    
          const VecValueType* inVec, SizeType vecSize) const
    
      {
    
          VecValueType result = zeroVal<VecValueType>();
    
        2/2✓ Branch 0 taken 5286932057 times.
✓ Branch 1 taken 1065587941 times.

      12705039996
          for (SizeType idx = 0, N = std::min(vecSize, this->size()); idx < N; ++idx) {
    
      10573864114
              result += static_cast<VecValueType>(this->value(idx) * inVec[this->column(idx)]);
    
          }
    
      2131175882
          return result;
    
      }
    
      /// @brief Return the dot product of this row with the vector @a inVec,
      /// by forwarding the vector's array and size to the raw-array overload.
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename DataType>
      template<typename VecValueType>
      inline VecValueType
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowBase<DataType>::dot(
          const Vector<VecValueType>& inVec) const
      {
          const VecValueType* elements = inVec.data();
          return dot(elements, inVec.size());
      }
    
      /// @brief Return a string listing this row's stored entries in storage order
      /// as comma-separated <tt>(column, value)</tt> pairs.
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename DataType>
      inline std::string
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowBase<DataType>::str() const
      {
          std::ostringstream ostr;
          const SizeType count = this->size();
          for (SizeType n = 0; n < count; ++n) {
              // Separate consecutive entries; nothing precedes the first one.
              if (n > 0) ostr << ", ";
              ostr << "(" << this->column(n) << ", " << this->value(n) << ")";
          }
          return ostr.str();
      }
    
      /// @brief Construct a read-only row accessor.
      /// @param valueHead   pointer to the first value slot of the row
      /// @param columnHead  pointer to the first column-index slot of the row
      /// @param rowSize     reference to the row's size counter
      /// @note Constness is cast away from all three arguments when they are
      /// passed to the row-data constructor.
      template<typename ValueType, SizeType STENCIL_SIZE>
      inline
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::ConstRow::ConstRow(
          const ValueType* valueHead, const SizeType* columnHead, const SizeType& rowSize)
          : ConstRowBase(
              ConstRowData(
                  const_cast<ValueType*>(valueHead),
                  const_cast<SizeType*>(columnHead),
                  const_cast<SizeType&>(rowSize)))
      {
      }
    
      template<typename ValueType, SizeType STENCIL_SIZE>
    
      inline
    
      70502483
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowEditor::RowEditor(
    
          ValueType* valueHead, SizeType* columnHead, SizeType& rowSize, SizeType colSize):
    
      70502483
          RowBase<>(RowData(valueHead, columnHead, rowSize)), mNumColumns(colSize)
    
      {
    
      }
    
      /// @brief Mark this row as empty by resetting its size to zero.
      /// @details The value and column slots themselves are left untouched.
      template<typename ValueType, SizeType STENCIL_SIZE>
      inline void
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowEditor::clear()
      {
          // Note: since mSize is a reference, this modifies the underlying matrix.
          RowData& data = RowBase<>::mData;
          data.mSize = 0;
      }
    
      /// @brief Set the value for @a column in this row, adding the column if it
      /// is not already stored.
      /// @details Entries are kept sorted by column index: a new column is either
      /// appended or inserted after shifting the subsequent entries up by one slot.
      /// @return the number of entries stored in this row after the update
      /// @note Assertions check that @a column is less than the column count and,
      /// when a new entry is needed, that the row size is below the row's capacity.
      template<typename ValueType, SizeType STENCIL_SIZE>
      inline SizeType
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowEditor::setValue(
          SizeType column, const ValueType& value)
      {
          assert(column < mNumColumns);

          RowData& data = RowBase<>::mData;

          // Get the offset of the first column index that is equal to or greater than
          // the column to be modified.
          const SizeType offset = this->find(column);

          // If the column already exists, just update its value.
          const bool columnExists = (offset < data.mSize) && (data.mCols[offset] == column);
          if (columnExists) {
              data.mVals[offset] = value;
              return data.mSize;
          }

          // Check that it is safe to add a new column.
          assert(data.mSize < this->capacity());

          if (offset < data.mSize) {
              // Insert the new column at the computed offset after shifting subsequent columns.
              SizeType slot = data.mSize;
              while (slot > offset) {
                  data.mVals[slot] = data.mVals[slot - 1];
                  data.mCols[slot] = data.mCols[slot - 1];
                  --slot;
              }
              data.mVals[offset] = value;
              data.mCols[offset] = column;
          } else {
              // The new column's index is larger than any existing index.  Append the new column.
              data.mVals[data.mSize] = value;
              data.mCols[data.mSize] = column;
          }

          ++data.mSize;
          return data.mSize;
      }
    
      /// @brief Multiply every stored entry of this row by @a s, in place.
      /// @param s  the scale factor; applied with @c operator*= to each stored value
      template<typename ValueType, SizeType STENCIL_SIZE>
      template<typename Scalar>
      inline void
      SparseStencilMatrix<ValueType, STENCIL_SIZE>::RowEditor::scale(const Scalar& s)
      {
          RowData& data = RowBase<>::mData;
          // Index with SizeType (the type used for row sizes everywhere else in
          // this file) rather than int, to avoid an implicit unsigned-to-signed
          // conversion of the row size.
          for (SizeType idx = 0, N = this->size(); idx < N; ++idx) {
              data.mVals[idx] *= s;
          }
      }
    
      ////////////////////////////////////////
    
      /// @brief Diagonal (Jacobi) preconditioner
      /// @details On construction, the reciprocal of each diagonal entry of the
      /// matrix is stored.  Applying the preconditioner multiplies the input vector
      /// element-wise by those stored reciprocals.
      template<typename MatrixType>
      class JacobiPreconditioner: public Preconditioner<typename MatrixType::ValueType>
      {
      public:
          using ValueType = typename MatrixType::ValueType;
          using BaseType = Preconditioner<ValueType>;
          using VectorType = Vector<ValueType>;
          using Ptr = SharedPtr<JacobiPreconditioner>;

          /// @brief Construct from matrix @a A by inverting each of its diagonal entries.
          /// @note Diagonal entries are asserted not to be approximately zero.
          JacobiPreconditioner(const MatrixType& A): BaseType(A), mDiag(A.numRows())
          {
              const MatrixType* matrix = &A;
              ValueType* inverseDiag = mDiag.data();

              // Populate mDiag in parallel with the reciprocals of the diagonal of A.
              tbb::parallel_for(SizeRange(0, A.numRows()),
                  [matrix, inverseDiag](const SizeRange& range) {
                      for (SizeType n = range.begin(), N = range.end(); n < N; ++n) {
                          const ValueType val = matrix->getValue(n, n);
                          assert(!isApproxZero(val, ValueType(0.0001)));
                          inverseDiag[n] = static_cast<ValueType>(1.0 / val);
                      }
                  });
          }

          ~JacobiPreconditioner() override = default;

          /// @brief Compute @a z[n] = diag[n] * @a r[n] for every element, where
          /// diag holds the stored reciprocals of the matrix diagonal.
          /// @param r  input vector; asserted to have the same size as the diagonal
          /// @param z  output vector; asserted to have the same size as @a r
          void apply(const Vector<ValueType>& r, Vector<ValueType>& z) override
          {
              const SizeType size = mDiag.size();

              assert(r.size() == z.size());
              assert(r.size() == size);

              const ValueType* diag = mDiag.data();
              const ValueType* in = r.data();
              ValueType* out = z.data();

              // Element-wise product, evaluated in parallel.
              tbb::parallel_for(SizeRange(0, size),
                  [diag, in, out](const SizeRange& range) {
                      for (SizeType n = range.begin(), N = range.end(); n < N; ++n) {
                          out[n] = diag[n] * in[n];
                      }
                  });
          }

          /// Return @c true if all values along the diagonal are finite.
          bool isFinite() const { return mDiag.isFinite(); }

      private:
          // The Jacobi preconditioner is a diagonal matrix; only its diagonal
          // (the reciprocals of the source matrix's diagonal) is stored.
          VectorType mDiag;
      }; // class JacobiPreconditioner
    
      /// @brief Preconditioner using incomplete Cholesky factorization
      /// @details The constructor builds a lower triangular factor restricted to the
      /// sparsity pattern of the source matrix, together with its transpose.
      /// apply() then performs a forward substitution with the lower factor followed
      /// by a backward substitution with the upper factor.
      template<typename MatrixType>
      class IncompleteCholeskyPreconditioner: public Preconditioner<typename MatrixType::ValueType>
      {
      private:
          struct CopyToLowerOp;
          struct TransposeOp;

      public:
          using ValueType = typename MatrixType::ValueType;
          using BaseType = Preconditioner<ValueType>;
          using VectorType = Vector<ValueType>;
          using Ptr = SharedPtr<IncompleteCholeskyPreconditioner>;
          using TriangularMatrix = SparseStencilMatrix<ValueType, 4>;
          using TriangleConstRow = typename TriangularMatrix::ConstRow;
          using TriangleRowEditor = typename TriangularMatrix::RowEditor;

          /// @brief Factor @a matrix, which is treated as symmetric.
          /// @details If a diagonal value smaller than 1e-5 is encountered, the
          /// factorization is abandoned and isValid() subsequently returns @c false.
          IncompleteCholeskyPreconditioner(const MatrixType& matrix)
              : BaseType(matrix)
              , mLowerTriangular(matrix.numRows())
              , mUpperTriangular(matrix.numRows())
              , mTempVec(matrix.numRows())
          {
              // Dimension of the (square) system
              const SizeType numRows = mLowerTriangular.numRows();

              // Seed the lower triangular matrix with the on-and-below-diagonal
              // entries of the source matrix.
              tbb::parallel_for(SizeRange(0, numRows), CopyToLowerOp(matrix, mLowerTriangular));

              // In-place incomplete Cholesky factorization of the lower triangle:
              //
              //   for each column k:
              //       A(k,k) = sqrt(A(k,k))
              //       for each i > k with A(i,k) != 0:
              //           A(i,k) /= A(k,k)
              //       for each j > k, for each i >= j with A(i,j) != 0:
              //           A(i,j) -= A(i,k) * A(j,k)
              //
              // Nonzero positions are taken from the rows of the source matrix.

              mPassedCompatibilityCondition = true;

              for (SizeType k = 0; k < numRows; ++k) {

                  ValueType pivot = mLowerTriangular.getConstRow(k).getValue(k);

                  // A tiny or negative pivot means the factorization has failed.
                  if (pivot < 1.e-5) {
                      mPassedCompatibilityCondition = false;
                      break;
                  }

                  pivot = Sqrt(pivot);
                  mLowerTriangular.getRowEditor(k).setValue(k, pivot);

                  // By symmetry, the nonzero entries of column k below the diagonal
                  // sit at the column indices stored in row k of the source matrix.
                  typename MatrixType::ConstRow srcRow = matrix.getConstRow(k);
                  typename MatrixType::ConstValueIter colIter = srcRow.cbegin();

                  // Scale column k below the diagonal by the pivot.
                  while (colIter) {
                      const SizeType i = colIter.column();
                      if (i > k) { // entries above the diagonal of the source row
                          mLowerTriangular.getRowEditor(i).setValue(k, *colIter / pivot);
                      }
                      ++colIter;
                  }

                  // Second pass over the same row: this time the column indices
                  // play the role of j in the (k,j) entries.
                  colIter.reset();
                  while (colIter) {
                      const SizeType j = colIter.column();
                      if (j > k) {
                          // a_jk is nonzero if a_kj is nonzero.
                          const ValueType a_jk = mLowerTriangular.getConstRow(j).getValue(k);

                          // Entry (i,j) is nonzero if matrix(j,i) is nonzero.
                          typename MatrixType::ConstRow maskRow = matrix.getConstRow(j);
                          typename MatrixType::ConstValueIter maskIter = maskRow.cbegin();
                          for ( ; maskIter; ++maskIter) {
                              const SizeType i = maskIter.column();
                              if (i < j) continue;

                              TriangleConstRow lowerRow_i = mLowerTriangular.getConstRow(i);
                              ValueType a_ij = lowerRow_i.getValue(j);
                              const ValueType a_ik = lowerRow_i.getValue(k);

                              a_ij -= a_ik * a_jk;
                              mLowerTriangular.getRowEditor(i).setValue(j, a_ij);
                          }
                      }
                      ++colIter;
                  }
              }

              // Build the transpose of the IC matrix: mUpperTriangular
              tbb::parallel_for(SizeRange(0, numRows),
                  TransposeOp(matrix, mLowerTriangular, mUpperTriangular));
          }

          ~IncompleteCholeskyPreconditioner() override = default;

          /// Return @c true if the factorization completed without hitting a bad pivot.
          bool isValid() const override { return mPassedCompatibilityCondition; }

          /// @brief Solve (lower * upper) * @a zVec = @a rVec for @a zVec.
          /// @param rVec  the right-hand side (asserted to match the matrix size)
          /// @param zVec  the result; zero-filled before being overwritten
          /// @throw ArithmeticError if the factorization failed during construction
          void apply(const Vector<ValueType>& rVec, Vector<ValueType>& zVec) override
          {
              if (!mPassedCompatibilityCondition) {
                  OPENVDB_THROW(ArithmeticError, "invalid Cholesky decomposition");
              }

              const SizeType size = mLowerTriangular.numRows();

              zVec.fill(zeroVal<ValueType>());
              ValueType* zData = zVec.data();

              if (size == 0) return;

              assert(rVec.size() == size);
              assert(zVec.size() == size);

              // Reset the scratch vector.  Entries that have not been solved for yet
              // must be zero, because each row's dot product spans the whole row.
              mTempVec.fill(zeroVal<ValueType>());
              ValueType* tmpData = mTempVec.data();
              const ValueType* rData = rVec.data();

              // Forward substitution: solve mLowerTriangular * tmp = rVec.
              for (SizeType i = 0; i < size; ++i) {
                  TriangleConstRow row = mLowerTriangular.getConstRow(i);
                  ValueType diagonal = row.getValue(i);
                  ValueType dot = row.dot(mTempVec);
                  tmpData[i] = (rData[i] - dot) / diagonal;
                  if (!std::isfinite(tmpData[i])) {
                      OPENVDB_LOG_DEBUG_RUNTIME("1 diagonal was " << diagonal);
                      OPENVDB_LOG_DEBUG_RUNTIME("1a diagonal " << row.getValue(i));
                  }
              }

              // Backward substitution: solve mUpperTriangular * zVec = tmp,
              // visiting rows from the last down to the first.
              for (SizeType i = size; i-- > 0; ) {
                  TriangleConstRow row = mUpperTriangular.getConstRow(i);
                  ValueType diagonal = row.getValue(i);
                  ValueType dot = row.dot(zVec);
                  zData[i] = (tmpData[i] - dot) / diagonal;
                  if (!std::isfinite(zData[i])) {
                      OPENVDB_LOG_DEBUG_RUNTIME("2 diagonal was " << diagonal);
                  }
              }
          }

          /// Return the lower triangular factor.
          const TriangularMatrix& lowerMatrix() const { return mLowerTriangular; }
          /// Return the upper triangular factor (the transpose of the lower factor).
          const TriangularMatrix& upperMatrix() const { return mUpperTriangular; }

      private:
          // Functor for use with tbb::parallel_for().
          // Copies the entries on or below the diagonal of each source row
          // into the corresponding row of the lower triangular matrix.
          struct CopyToLowerOp
          {
              CopyToLowerOp(const MatrixType& m, TriangularMatrix& l): mat(&m), lower(&l) {}

              void operator()(const SizeRange& range) const {
                  for (SizeType n = range.begin(), N = range.end(); n < N; ++n) {
                      TriangleRowEditor dstRow = lower->getRowEditor(n);
                      dstRow.clear();
                      typename MatrixType::ConstRow srcRow = mat->getConstRow(n);
                      typename MatrixType::ConstValueIter it = srcRow.cbegin();
                      for ( ; it; ++it) {
                          // Entries above the diagonal are skipped.
                          if (!(it.column() > n)) {
                              dstRow.setValue(it.column(), *it);
                          }
                      }
                  }
              }

              const MatrixType* mat; TriangularMatrix* lower;
          };

          // Functor for use with tbb::parallel_for().
          // Fills each row of the upper triangular matrix with the transposed
          // entries of the lower triangular matrix.
          struct TransposeOp
          {
              TransposeOp(const MatrixType& m, const TriangularMatrix& l, TriangularMatrix& u):
                  mat(&m), lower(&l), upper(&u) {}

              void operator()(const SizeRange& range) const {
                  for (SizeType n = range.begin(), N = range.end(); n < N; ++n) {
                      TriangleRowEditor dstRow = upper->getRowEditor(n);
                      dstRow.clear();
                      // The source matrix is symmetric, so its row n supplies the
                      // column indices at which upper(n, column) may be nonzero.
                      typename MatrixType::ConstRow srcRow = mat->getConstRow(n);
                      typename MatrixType::ConstValueIter it = srcRow.cbegin();
                      for ( ; it; ++it) {
                          const SizeType column = it.column();
                          // Only the upper triangle (column >= n) is populated.
                          if (!(column < n)) {
                              dstRow.setValue(column, lower->getValue(column, n));
                          }
                      }
                  }
              }

              const MatrixType* mat; const TriangularMatrix* lower; TriangularMatrix* upper;
          };

          TriangularMatrix  mLowerTriangular;
          TriangularMatrix  mUpperTriangular;
          Vector<ValueType> mTempVec; // scratch storage reused by apply()
          bool              mPassedCompatibilityCondition;
      }; // class IncompleteCholeskyPreconditioner
    
      ////////////////////////////////////////
    
      namespace internal {
    
      /// Compute @e ax + @e y.
    
      template<typename T>
    
      inline void
    
      axpy(const T& a, const T* xVec, const T* yVec, T* resultVec, SizeType size)
    
      {
    
      1404
          tbb::parallel_for(SizeRange(0, size), LinearOp<T>(a, xVec, yVec, resultVec));
    
      }
    
      /// Compute @e ax + @e y.
    
      template<typename T>
    
      inline void
    
      1404
      axpy(const T& a, const Vector<T>& xVec, const Vector<T>& yVec, Vector<T>& result)
    
      {
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 1404 times.

      1404
          assert(xVec.size() == yVec.size());
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 1404 times.

      1404
          assert(xVec.size() == result.size());
    
          axpy(a, xVec.data(), yVec.data(), result.data(), xVec.size());
    
      1404
      }
    
      /// Compute @e r = @e b &minus; @e Ax.
    
      template<typename MatrixOperator, typename VecValueType>
    
      inline void
    
      9
      computeResidual(const MatrixOperator& A, const VecValueType* x,
    
          const VecValueType* b, VecValueType* r)
    
      {
    
          // Compute r = A * x.
    
          A.vectorMultiply(x, r);
    
          // Compute r = b - r.
    
      9
          tbb::parallel_for(SizeRange(0, A.numRows()), LinearOp<VecValueType>(-1.0, r, b, r));
    
      9
      }
    
      /// Compute @e r = @e b &minus; @e Ax.
    
      template<typename MatrixOperator, typename T>
    
      inline void
    
      9
      computeResidual(const MatrixOperator& A, const Vector<T>& x, const Vector<T>& b, Vector<T>& r)
    
      {
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.

      9
          assert(x.size() == b.size());
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.

      9
          assert(x.size() == r.size());
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.

      9
          assert(x.size() == A.numRows());
    
      9
          computeResidual(A, x.data(), b.data(), r.data());
    
      9
      }
    
      } // namespace internal
    
      ////////////////////////////////////////
    
      /// @brief Solve @e Ax = @e b without support for interruption.
      /// @details Forwards to the interruptible overload of solve(), supplying
      /// a util::NullInterrupter.
      template<typename PositiveDefMatrix>
      inline State
      solve(
          const PositiveDefMatrix& Amat,
          const Vector<typename PositiveDefMatrix::ValueType>& bVec,
          Vector<typename PositiveDefMatrix::ValueType>& xVec,
          Preconditioner<typename PositiveDefMatrix::ValueType>& precond,
          const State& termination)
      {
          util::NullInterrupter nullInterrupter;
          return solve(
              Amat, bVec, xVec, precond,
              nullInterrupter,
              termination);
      }
    
      template<typename PositiveDefMatrix, typename Interrupter>
    
      inline State
    
      9
      solve(
    
          const PositiveDefMatrix& Amat,
    
          const Vector<typename PositiveDefMatrix::ValueType>& bVec,
    
          Vector<typename PositiveDefMatrix::ValueType>& xVec,
    
          Preconditioner<typename PositiveDefMatrix::ValueType>& precond,
    
          Interrupter& interrupter,
    
          const State& termination)
    
      {
    
          using ValueType = typename PositiveDefMatrix::ValueType;
    
          using VectorType = Vector<ValueType>;
    
          State result;
    
      9
          result.success = false;
    
      9
          result.iterations = 0;
    
      9
          result.relativeError = 0.0;
    
      9
          result.absoluteError = 0.0;
    
          const SizeType size = Amat.numRows();
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.

      9
          if (size == 0) {
    
              OPENVDB_LOG_WARN("pcg::solve(): matrix has dimension zero");
    
              return result;
    
          }
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.

      9
          if (size != bVec.size()) {
    
      ✗
              OPENVDB_THROW(ArithmeticError, "A and b have incompatible sizes"
    
                  << size << "x" << size << " vs. " << bVec.size() << ")");
    
          }
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.

      9
          if (size != xVec.size()) {
    
      ✗
              OPENVDB_THROW(ArithmeticError, "A and x have incompatible sizes"
    
                  << size << "x" << size << " vs. " << xVec.size() << ")");
    
          }
    
          // Temp vectors
    
          VectorType zVec(size); // transformed residual (M^-1 r)
    
          VectorType pVec(size); // search direction
    
          VectorType qVec(size); // A * p
    
          // Compute norm of B (the source)
    
        1/2✓ Branch 1 taken 9 times.
✗ Branch 2 not taken.

      9
          const ValueType tmp = bVec.infNorm();
    
        1/2✓ Branch 0 taken 9 times.
✗ Branch 1 not taken.

      9
          const ValueType infNormOfB = isZero(tmp) ? ValueType(1) : tmp;
    
          // Compute rVec: residual = b - Ax.
    
          VectorType rVec(size); // vector of residuals
    
        1/2✓ Branch 1 taken 9 times.
✗ Branch 2 not taken.

      9
          internal::computeResidual(Amat, xVec, bVec, rVec);
    
        2/4✓ Branch 1 taken 9 times.
✗ Branch 2 not taken.
✗ Branch 3 not taken.
✓ Branch 4 taken 9 times.

      9
          assert(rVec.isFinite());
    
          // Normalize the residual norm with the source norm and look for early out.
    
        1/2✓ Branch 1 taken 9 times.
✗ Branch 2 not taken.

      9
          result.absoluteError = static_cast<double>(rVec.infNorm());
    
      9
          result.relativeError = static_cast<double>(result.absoluteError / infNormOfB);
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 9 times.

      9
          if (result.relativeError <= termination.relativeError) {
    
      ✗
              result.success = true;
    
      ✗
              return result;
    
          }
    
          // Iterations of the CG solve
    
          ValueType rDotZPrev(1); // inner product of <z,r>
    
          // Keep track of the minimum error to monitor convergence.
    
      9
          ValueType minL2Error = std::numeric_limits<ValueType>::max();
    
          ValueType l2Error;
    
          int iteration = 0;
    
        1/2✓ Branch 0 taken 471 times.
✗ Branch 1 not taken.

      471
          for ( ; iteration < termination.iterations; ++iteration) {
    
        2/4✓ Branch 1 taken 471 times.
✗ Branch 2 not taken.
✗ Branch 3 not taken.
✓ Branch 4 taken 471 times.

      471
              if (interrupter.wasInterrupted()) {
    
      ✗
                  OPENVDB_THROW(RuntimeError, "conjugate gradient solver was interrupted");
    
              }
    
              OPENVDB_LOG_DEBUG_RUNTIME("pcg::solve() " << result);
    
      471
              result.iterations = iteration + 1;
    
              // Apply preconditioner to residual
    
              // z_{k} = M^-1 r_{k}
    
        1/2✓ Branch 1 taken 471 times.
✗ Branch 2 not taken.

      471
              precond.apply(rVec, zVec);
    
              // <r,z>
    
        1/2✓ Branch 1 taken 471 times.
✗ Branch 2 not taken.

      471
              const ValueType rDotZ = rVec.dot(zVec);
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 471 times.

      471
              assert(std::isfinite(rDotZ));
    
        2/2✓ Branch 0 taken 9 times.
✓ Branch 1 taken 462 times.

      471
              if (0 == iteration) {
    
                  // Initialize
    
        1/2✓ Branch 1 taken 9 times.
✗ Branch 2 not taken.

      9
                  pVec = zVec;
    
              } else {
    
      462
                  const ValueType beta = rDotZ / rDotZPrev;
    
                  // p = beta * p + z
    
        1/2✓ Branch 1 taken 462 times.
✗ Branch 2 not taken.

      462
                  internal::axpy(beta, pVec, zVec, /*result */pVec);
    
              }
    
              // q_{k} = A p_{k}
    
        1/2✓ Branch 1 taken 471 times.
✗ Branch 2 not taken.

      471
              Amat.vectorMultiply(pVec, qVec);
    
              // alpha = <r_{k-1}, z_{k-1}> / <p_{k},q_{k}>
    
        1/2✓ Branch 1 taken 471 times.
✗ Branch 2 not taken.

      471
              const ValueType pAp = pVec.dot(qVec);
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 471 times.

      471
              assert(std::isfinite(pAp));
    
      471
              const ValueType alpha = rDotZ / pAp;
    
              rDotZPrev = rDotZ;
    
              // x_{k} = x_{k-1} + alpha * p_{k}
    
        1/2✓ Branch 1 taken 471 times.
✗ Branch 2 not taken.

      471
              internal::axpy(alpha, pVec, xVec, /*result=*/xVec);
    
              // r_{k} = r_{k-1} - alpha_{k-1} A p_{k}
    
        2/6✓ Branch 1 taken 471 times.
✗ Branch 2 not taken.
✓ Branch 4 taken 471 times.
✗ Branch 5 not taken.
✗ Branch 6 not taken.
✗ Branch 7 not taken.

      471
              internal::axpy(-alpha, qVec, rVec, /*result=*/rVec);
    
              // update tolerances
    
        2/2✓ Branch 0 taken 99 times.
✓ Branch 1 taken 372 times.

      471
              l2Error = rVec.l2Norm();
    
      471
              minL2Error = Min(l2Error, minL2Error);
    
        1/2✓ Branch 1 taken 471 times.
✗ Branch 2 not taken.

      471
              result.absoluteError = static_cast<double>(rVec.infNorm());
    
      471
              result.relativeError = static_cast<double>(result.absoluteError / infNormOfB);
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 471 times.

      471
              if (l2Error > 2 * minL2Error) {
    
                  // The solution started to diverge.
    
      ✗
                  result.success = false;
    
      9
                  break;
    
              }
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 471 times.

      471
              if (!std::isfinite(result.absoluteError)) {
    
                  // Total divergence of solution
    
      ✗
                  result.success = false;
    
      ✗
                  break;
    
              }
    
        2/2✓ Branch 0 taken 6 times.
✓ Branch 1 taken 465 times.

      471
              if (result.absoluteError <= termination.absoluteError) {
    
                  // Convergence
    
      6
                  result.success = true;
    
      6
                  break;
    
              }
    
        2/2✓ Branch 0 taken 3 times.
✓ Branch 1 taken 462 times.

      465
              if (result.relativeError <= termination.relativeError) {
    
                  // Convergence
    
      3
                  result.success = true;
    
      3
                  break;
    
              }
    
          }
    
          OPENVDB_LOG_DEBUG_RUNTIME("pcg::solve() " << result);
    
          return result;
    
      }
    
      } // namespace pcg
    
      } // namespace math
    
      } // namespace OPENVDB_VERSION_NAME
    
      } // namespace openvdb
    
      #endif // OPENVDB_MATH_CONJGRADIENT_HAS_BEEN_INCLUDED