src/SparseLU/SparseLU.h

// This file is part of Eigen, a lightweight C++ template library
// for linear algebra.
//
// Copyright (C) 2012 Désiré Nuentsa-Wakam <[email protected]>
// Copyright (C) 2012-2014 Gael Guennebaud <[email protected]>
//
// This Source Code Form is subject to the terms of the Mozilla
// Public License v. 2.0. If a copy of the MPL was not distributed
// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.


*bf2c3715SXin Li#ifndef EIGEN_SPARSE_LU_H
*bf2c3715SXin Li#define EIGEN_SPARSE_LU_H
*bf2c3715SXin Li
*bf2c3715SXin Linamespace Eigen {
*bf2c3715SXin Li
*bf2c3715SXin Litemplate <typename _MatrixType, typename _OrderingType = COLAMDOrdering<typename _MatrixType::StorageIndex> > class SparseLU;
*bf2c3715SXin Litemplate <typename MappedSparseMatrixType> struct SparseLUMatrixLReturnType;
*bf2c3715SXin Litemplate <typename MatrixLType, typename MatrixUType> struct SparseLUMatrixUReturnType;
*bf2c3715SXin Li
*bf2c3715SXin Litemplate <bool Conjugate,class SparseLUType>
*bf2c3715SXin Liclass SparseLUTransposeView : public SparseSolverBase<SparseLUTransposeView<Conjugate,SparseLUType> >
*bf2c3715SXin Li{
*bf2c3715SXin Liprotected:
*bf2c3715SXin Li  typedef SparseSolverBase<SparseLUTransposeView<Conjugate,SparseLUType> > APIBase;
*bf2c3715SXin Li  using APIBase::m_isInitialized;
*bf2c3715SXin Lipublic:
*bf2c3715SXin Li  typedef typename SparseLUType::Scalar Scalar;
*bf2c3715SXin Li  typedef typename SparseLUType::StorageIndex StorageIndex;
*bf2c3715SXin Li  typedef typename SparseLUType::MatrixType MatrixType;
*bf2c3715SXin Li  typedef typename SparseLUType::OrderingType OrderingType;
*bf2c3715SXin Li
*bf2c3715SXin Li  enum {
*bf2c3715SXin Li    ColsAtCompileTime = MatrixType::ColsAtCompileTime,
*bf2c3715SXin Li    MaxColsAtCompileTime = MatrixType::MaxColsAtCompileTime
*bf2c3715SXin Li  };
*bf2c3715SXin Li
*bf2c3715SXin Li  SparseLUTransposeView() : m_sparseLU(NULL) {}
*bf2c3715SXin Li  SparseLUTransposeView(const SparseLUTransposeView& view) {
*bf2c3715SXin Li    this->m_sparseLU = view.m_sparseLU;
*bf2c3715SXin Li  }
*bf2c3715SXin Li  void setIsInitialized(const bool isInitialized) {this->m_isInitialized = isInitialized;}
*bf2c3715SXin Li  void setSparseLU(SparseLUType* sparseLU) {m_sparseLU = sparseLU;}
*bf2c3715SXin Li  using APIBase::_solve_impl;
*bf2c3715SXin Li  template<typename Rhs, typename Dest>
*bf2c3715SXin Li  bool _solve_impl(const MatrixBase<Rhs> &B, MatrixBase<Dest> &X_base) const
*bf2c3715SXin Li  {
*bf2c3715SXin Li    Dest& X(X_base.derived());
*bf2c3715SXin Li    eigen_assert(m_sparseLU->info() == Success && "The matrix should be factorized first");
*bf2c3715SXin Li    EIGEN_STATIC_ASSERT((Dest::Flags&RowMajorBit)==0,
*bf2c3715SXin Li                        THIS_METHOD_IS_ONLY_FOR_COLUMN_MAJOR_MATRICES);
*bf2c3715SXin Li
*bf2c3715SXin Li
*bf2c3715SXin Li    // this ugly const_cast_derived() helps to detect aliasing when applying the permutations
*bf2c3715SXin Li    for(Index j = 0; j < B.cols(); ++j){
*bf2c3715SXin Li      X.col(j) = m_sparseLU->colsPermutation() * B.const_cast_derived().col(j);
*bf2c3715SXin Li    }
*bf2c3715SXin Li    //Forward substitution with transposed or adjoint of U
*bf2c3715SXin Li    m_sparseLU->matrixU().template solveTransposedInPlace<Conjugate>(X);
*bf2c3715SXin Li
*bf2c3715SXin Li    //Backward substitution with transposed or adjoint of L
*bf2c3715SXin Li    m_sparseLU->matrixL().template solveTransposedInPlace<Conjugate>(X);
*bf2c3715SXin Li
*bf2c3715SXin Li    // Permute back the solution
*bf2c3715SXin Li    for (Index j = 0; j < B.cols(); ++j)
*bf2c3715SXin Li      X.col(j) = m_sparseLU->rowsPermutation().transpose() * X.col(j);
*bf2c3715SXin Li    return true;
*bf2c3715SXin Li  }
*bf2c3715SXin Li  inline Index rows() const { return m_sparseLU->rows(); }
*bf2c3715SXin Li  inline Index cols() const { return m_sparseLU->cols(); }
*bf2c3715SXin Li
*bf2c3715SXin Liprivate:
*bf2c3715SXin Li  SparseLUType *m_sparseLU;
*bf2c3715SXin Li  SparseLUTransposeView& operator=(const SparseLUTransposeView&);
*bf2c3715SXin Li};
*bf2c3715SXin Li
*bf2c3715SXin Li
*bf2c3715SXin Li/** \ingroup SparseLU_Module
*bf2c3715SXin Li  * \class SparseLU
*bf2c3715SXin Li  *
*bf2c3715SXin Li  * \brief Sparse supernodal LU factorization for general matrices
*bf2c3715SXin Li  *
*bf2c3715SXin Li  * This class implements the supernodal LU factorization for general matrices.
*bf2c3715SXin Li  * It uses the main techniques from the sequential SuperLU package
*bf2c3715SXin Li  * (http://crd-legacy.lbl.gov/~xiaoye/SuperLU/). It handles transparently real
*bf2c3715SXin Li  * and complex arithmetic with single and double precision, depending on the
*bf2c3715SXin Li  * scalar type of your input matrix.
*bf2c3715SXin Li  * The code has been optimized to provide BLAS-3 operations during supernode-panel updates.
*bf2c3715SXin Li  * It benefits directly from the built-in high-performant Eigen BLAS routines.
*bf2c3715SXin Li  * Moreover, when the size of a supernode is very small, the BLAS calls are avoided to
*bf2c3715SXin Li  * enable a better optimization from the compiler. For best performance,
*bf2c3715SXin Li  * you should compile it with NDEBUG flag to avoid the numerous bounds checking on vectors.
*bf2c3715SXin Li  *
*bf2c3715SXin Li  * An important parameter of this class is the ordering method. It is used to reorder the columns
*bf2c3715SXin Li  * (and eventually the rows) of the matrix to reduce the number of new elements that are created during
*bf2c3715SXin Li  * numerical factorization. The cheapest method available is COLAMD.
*bf2c3715SXin Li  * See  \link OrderingMethods_Module the OrderingMethods module \endlink for the list of
*bf2c3715SXin Li  * built-in and external ordering methods.
*bf2c3715SXin Li  *
*bf2c3715SXin Li  * Simple example with key steps
*bf2c3715SXin Li  * \code
*bf2c3715SXin Li  * VectorXd x(n), b(n);
*bf2c3715SXin Li  * SparseMatrix<double> A;
*bf2c3715SXin Li  * SparseLU<SparseMatrix<double>, COLAMDOrdering<int> >   solver;
*bf2c3715SXin Li  * // fill A and b;
*bf2c3715SXin Li  * // Compute the ordering permutation vector from the structural pattern of A
*bf2c3715SXin Li  * solver.analyzePattern(A);
*bf2c3715SXin Li  * // Compute the numerical factorization
*bf2c3715SXin Li  * solver.factorize(A);
*bf2c3715SXin Li  * //Use the factors to solve the linear system
*bf2c3715SXin Li  * x = solver.solve(b);
*bf2c3715SXin Li  * \endcode
*bf2c3715SXin Li  *
*bf2c3715SXin Li  * \warning The input matrix A should be in a \b compressed and \b column-major form.
*bf2c3715SXin Li  * Otherwise an expensive copy will be made. You can call the inexpensive makeCompressed() to get a compressed matrix.
*bf2c3715SXin Li  *
*bf2c3715SXin Li  * \note Unlike the initial SuperLU implementation, there is no step to equilibrate the matrix.
*bf2c3715SXin Li  * For badly scaled matrices, this step can be useful to reduce the pivoting during factorization.
*bf2c3715SXin Li  * If this is the case for your matrices, you can try the basic scaling method at
*bf2c3715SXin Li  *  "unsupported/Eigen/src/IterativeSolvers/Scaling.h"
*bf2c3715SXin Li  *
*bf2c3715SXin Li  * \tparam _MatrixType The type of the sparse matrix. It must be a column-major SparseMatrix<>
*bf2c3715SXin Li  * \tparam _OrderingType The ordering method to use, either AMD, COLAMD or METIS. Default is COLMAD
*bf2c3715SXin Li  *
*bf2c3715SXin Li  * \implsparsesolverconcept
*bf2c3715SXin Li  *
*bf2c3715SXin Li  * \sa \ref TutorialSparseSolverConcept
*bf2c3715SXin Li  * \sa \ref OrderingMethods_Module
*bf2c3715SXin Li  */
*bf2c3715SXin Litemplate <typename _MatrixType, typename _OrderingType>
*bf2c3715SXin Liclass SparseLU : public SparseSolverBase<SparseLU<_MatrixType,_OrderingType> >, public internal::SparseLUImpl<typename _MatrixType::Scalar, typename _MatrixType::StorageIndex>
*bf2c3715SXin Li{
*bf2c3715SXin Li  protected:
*bf2c3715SXin Li    typedef SparseSolverBase<SparseLU<_MatrixType,_OrderingType> > APIBase;
*bf2c3715SXin Li    using APIBase::m_isInitialized;
*bf2c3715SXin Li  public:
*bf2c3715SXin Li    using APIBase::_solve_impl;
*bf2c3715SXin Li
*bf2c3715SXin Li    typedef _MatrixType MatrixType;
*bf2c3715SXin Li    typedef _OrderingType OrderingType;
*bf2c3715SXin Li    typedef typename MatrixType::Scalar Scalar;
*bf2c3715SXin Li    typedef typename MatrixType::RealScalar RealScalar;
*bf2c3715SXin Li    typedef typename MatrixType::StorageIndex StorageIndex;
*bf2c3715SXin Li    typedef SparseMatrix<Scalar,ColMajor,StorageIndex> NCMatrix;
*bf2c3715SXin Li    typedef internal::MappedSuperNodalMatrix<Scalar, StorageIndex> SCMatrix;
*bf2c3715SXin Li    typedef Matrix<Scalar,Dynamic,1> ScalarVector;
*bf2c3715SXin Li    typedef Matrix<StorageIndex,Dynamic,1> IndexVector;
*bf2c3715SXin Li    typedef PermutationMatrix<Dynamic, Dynamic, StorageIndex> PermutationType;
*bf2c3715SXin Li    typedef internal::SparseLUImpl<Scalar, StorageIndex> Base;
*bf2c3715SXin Li
*bf2c3715SXin Li    enum {
*bf2c3715SXin Li      ColsAtCompileTime = MatrixType::ColsAtCompileTime,
*bf2c3715SXin Li      MaxColsAtCompileTime = MatrixType::MaxColsAtCompileTime
*bf2c3715SXin Li    };
*bf2c3715SXin Li
*bf2c3715SXin Li  public:
*bf2c3715SXin Li
*bf2c3715SXin Li    SparseLU():m_lastError(""),m_Ustore(0,0,0,0,0,0),m_symmetricmode(false),m_diagpivotthresh(1.0),m_detPermR(1)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      initperfvalues();
*bf2c3715SXin Li    }
*bf2c3715SXin Li    explicit SparseLU(const MatrixType& matrix)
*bf2c3715SXin Li      : m_lastError(""),m_Ustore(0,0,0,0,0,0),m_symmetricmode(false),m_diagpivotthresh(1.0),m_detPermR(1)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      initperfvalues();
*bf2c3715SXin Li      compute(matrix);
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    ~SparseLU()
*bf2c3715SXin Li    {
*bf2c3715SXin Li      // Free all explicit dynamic pointers
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    void analyzePattern (const MatrixType& matrix);
*bf2c3715SXin Li    void factorize (const MatrixType& matrix);
*bf2c3715SXin Li    void simplicialfactorize(const MatrixType& matrix);
*bf2c3715SXin Li
*bf2c3715SXin Li    /**
*bf2c3715SXin Li      * Compute the symbolic and numeric factorization of the input sparse matrix.
*bf2c3715SXin Li      * The input matrix should be in column-major storage.
*bf2c3715SXin Li      */
*bf2c3715SXin Li    void compute (const MatrixType& matrix)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      // Analyze
*bf2c3715SXin Li      analyzePattern(matrix);
*bf2c3715SXin Li      //Factorize
*bf2c3715SXin Li      factorize(matrix);
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    /** \returns an expression of the transposed of the factored matrix.
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * A typical usage is to solve for the transposed problem A^T x = b:
*bf2c3715SXin Li      * \code
*bf2c3715SXin Li      * solver.compute(A);
*bf2c3715SXin Li      * x = solver.transpose().solve(b);
*bf2c3715SXin Li      * \endcode
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \sa adjoint(), solve()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    const SparseLUTransposeView<false,SparseLU<_MatrixType,_OrderingType> > transpose()
*bf2c3715SXin Li    {
*bf2c3715SXin Li      SparseLUTransposeView<false,  SparseLU<_MatrixType,_OrderingType> > transposeView;
*bf2c3715SXin Li      transposeView.setSparseLU(this);
*bf2c3715SXin Li      transposeView.setIsInitialized(this->m_isInitialized);
*bf2c3715SXin Li      return transposeView;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li
*bf2c3715SXin Li    /** \returns an expression of the adjoint of the factored matrix
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * A typical usage is to solve for the adjoint problem A' x = b:
*bf2c3715SXin Li      * \code
*bf2c3715SXin Li      * solver.compute(A);
*bf2c3715SXin Li      * x = solver.adjoint().solve(b);
*bf2c3715SXin Li      * \endcode
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * For real scalar types, this function is equivalent to transpose().
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \sa transpose(), solve()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    const SparseLUTransposeView<true, SparseLU<_MatrixType,_OrderingType> > adjoint()
*bf2c3715SXin Li    {
*bf2c3715SXin Li      SparseLUTransposeView<true,  SparseLU<_MatrixType,_OrderingType> > adjointView;
*bf2c3715SXin Li      adjointView.setSparseLU(this);
*bf2c3715SXin Li      adjointView.setIsInitialized(this->m_isInitialized);
*bf2c3715SXin Li      return adjointView;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    inline Index rows() const { return m_mat.rows(); }
*bf2c3715SXin Li    inline Index cols() const { return m_mat.cols(); }
*bf2c3715SXin Li    /** Indicate that the pattern of the input matrix is symmetric */
*bf2c3715SXin Li    void isSymmetric(bool sym)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      m_symmetricmode = sym;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    /** \returns an expression of the matrix L, internally stored as supernodes
*bf2c3715SXin Li      * The only operation available with this expression is the triangular solve
*bf2c3715SXin Li      * \code
*bf2c3715SXin Li      * y = b; matrixL().solveInPlace(y);
*bf2c3715SXin Li      * \endcode
*bf2c3715SXin Li      */
*bf2c3715SXin Li    SparseLUMatrixLReturnType<SCMatrix> matrixL() const
*bf2c3715SXin Li    {
*bf2c3715SXin Li      return SparseLUMatrixLReturnType<SCMatrix>(m_Lstore);
*bf2c3715SXin Li    }
*bf2c3715SXin Li    /** \returns an expression of the matrix U,
*bf2c3715SXin Li      * The only operation available with this expression is the triangular solve
*bf2c3715SXin Li      * \code
*bf2c3715SXin Li      * y = b; matrixU().solveInPlace(y);
*bf2c3715SXin Li      * \endcode
*bf2c3715SXin Li      */
*bf2c3715SXin Li    SparseLUMatrixUReturnType<SCMatrix,MappedSparseMatrix<Scalar,ColMajor,StorageIndex> > matrixU() const
*bf2c3715SXin Li    {
*bf2c3715SXin Li      return SparseLUMatrixUReturnType<SCMatrix, MappedSparseMatrix<Scalar,ColMajor,StorageIndex> >(m_Lstore, m_Ustore);
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    /**
*bf2c3715SXin Li      * \returns a reference to the row matrix permutation \f$ P_r \f$ such that \f$P_r A P_c^T = L U\f$
*bf2c3715SXin Li      * \sa colsPermutation()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    inline const PermutationType& rowsPermutation() const
*bf2c3715SXin Li    {
*bf2c3715SXin Li      return m_perm_r;
*bf2c3715SXin Li    }
*bf2c3715SXin Li    /**
*bf2c3715SXin Li      * \returns a reference to the column matrix permutation\f$ P_c^T \f$ such that \f$P_r A P_c^T = L U\f$
*bf2c3715SXin Li      * \sa rowsPermutation()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    inline const PermutationType& colsPermutation() const
*bf2c3715SXin Li    {
*bf2c3715SXin Li      return m_perm_c;
*bf2c3715SXin Li    }
*bf2c3715SXin Li    /** Set the threshold used for a diagonal entry to be an acceptable pivot. */
*bf2c3715SXin Li    void setPivotThreshold(const RealScalar& thresh)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      m_diagpivotthresh = thresh;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li#ifdef EIGEN_PARSED_BY_DOXYGEN
*bf2c3715SXin Li    /** \returns the solution X of \f$ A X = B \f$ using the current decomposition of A.
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \warning the destination matrix X in X = this->solve(B) must be colmun-major.
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \sa compute()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    template<typename Rhs>
*bf2c3715SXin Li    inline const Solve<SparseLU, Rhs> solve(const MatrixBase<Rhs>& B) const;
*bf2c3715SXin Li#endif // EIGEN_PARSED_BY_DOXYGEN
*bf2c3715SXin Li
*bf2c3715SXin Li    /** \brief Reports whether previous computation was successful.
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \returns \c Success if computation was successful,
*bf2c3715SXin Li      *          \c NumericalIssue if the LU factorization reports a problem, zero diagonal for instance
*bf2c3715SXin Li      *          \c InvalidInput if the input matrix is invalid
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \sa iparm()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    ComputationInfo info() const
*bf2c3715SXin Li    {
*bf2c3715SXin Li      eigen_assert(m_isInitialized && "Decomposition is not initialized.");
*bf2c3715SXin Li      return m_info;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    /**
*bf2c3715SXin Li      * \returns A string describing the type of error
*bf2c3715SXin Li      */
*bf2c3715SXin Li    std::string lastErrorMessage() const
*bf2c3715SXin Li    {
*bf2c3715SXin Li      return m_lastError;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    template<typename Rhs, typename Dest>
*bf2c3715SXin Li    bool _solve_impl(const MatrixBase<Rhs> &B, MatrixBase<Dest> &X_base) const
*bf2c3715SXin Li    {
*bf2c3715SXin Li      Dest& X(X_base.derived());
*bf2c3715SXin Li      eigen_assert(m_factorizationIsOk && "The matrix should be factorized first");
*bf2c3715SXin Li      EIGEN_STATIC_ASSERT((Dest::Flags&RowMajorBit)==0,
*bf2c3715SXin Li                        THIS_METHOD_IS_ONLY_FOR_COLUMN_MAJOR_MATRICES);
*bf2c3715SXin Li
*bf2c3715SXin Li      // Permute the right hand side to form X = Pr*B
*bf2c3715SXin Li      // on return, X is overwritten by the computed solution
*bf2c3715SXin Li      X.resize(B.rows(),B.cols());
*bf2c3715SXin Li
*bf2c3715SXin Li      // this ugly const_cast_derived() helps to detect aliasing when applying the permutations
*bf2c3715SXin Li      for(Index j = 0; j < B.cols(); ++j)
*bf2c3715SXin Li        X.col(j) = rowsPermutation() * B.const_cast_derived().col(j);
*bf2c3715SXin Li
*bf2c3715SXin Li      //Forward substitution with L
*bf2c3715SXin Li      this->matrixL().solveInPlace(X);
*bf2c3715SXin Li      this->matrixU().solveInPlace(X);
*bf2c3715SXin Li
*bf2c3715SXin Li      // Permute back the solution
*bf2c3715SXin Li      for (Index j = 0; j < B.cols(); ++j)
*bf2c3715SXin Li        X.col(j) = colsPermutation().inverse() * X.col(j);
*bf2c3715SXin Li
*bf2c3715SXin Li      return true;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    /**
*bf2c3715SXin Li      * \returns the absolute value of the determinant of the matrix of which
*bf2c3715SXin Li      * *this is the QR decomposition.
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \warning a determinant can be very big or small, so for matrices
*bf2c3715SXin Li      * of large enough dimension, there is a risk of overflow/underflow.
*bf2c3715SXin Li      * One way to work around that is to use logAbsDeterminant() instead.
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \sa logAbsDeterminant(), signDeterminant()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    Scalar absDeterminant()
*bf2c3715SXin Li    {
*bf2c3715SXin Li      using std::abs;
*bf2c3715SXin Li      eigen_assert(m_factorizationIsOk && "The matrix should be factorized first.");
*bf2c3715SXin Li      // Initialize with the determinant of the row matrix
*bf2c3715SXin Li      Scalar det = Scalar(1.);
*bf2c3715SXin Li      // Note that the diagonal blocks of U are stored in supernodes,
*bf2c3715SXin Li      // which are available in the  L part :)
*bf2c3715SXin Li      for (Index j = 0; j < this->cols(); ++j)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        for (typename SCMatrix::InnerIterator it(m_Lstore, j); it; ++it)
*bf2c3715SXin Li        {
*bf2c3715SXin Li          if(it.index() == j)
*bf2c3715SXin Li          {
*bf2c3715SXin Li            det *= abs(it.value());
*bf2c3715SXin Li            break;
*bf2c3715SXin Li          }
*bf2c3715SXin Li        }
*bf2c3715SXin Li      }
*bf2c3715SXin Li      return det;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    /** \returns the natural log of the absolute value of the determinant of the matrix
*bf2c3715SXin Li      * of which **this is the QR decomposition
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \note This method is useful to work around the risk of overflow/underflow that's
*bf2c3715SXin Li      * inherent to the determinant computation.
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \sa absDeterminant(), signDeterminant()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    Scalar logAbsDeterminant() const
*bf2c3715SXin Li    {
*bf2c3715SXin Li      using std::log;
*bf2c3715SXin Li      using std::abs;
*bf2c3715SXin Li
*bf2c3715SXin Li      eigen_assert(m_factorizationIsOk && "The matrix should be factorized first.");
*bf2c3715SXin Li      Scalar det = Scalar(0.);
*bf2c3715SXin Li      for (Index j = 0; j < this->cols(); ++j)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        for (typename SCMatrix::InnerIterator it(m_Lstore, j); it; ++it)
*bf2c3715SXin Li        {
*bf2c3715SXin Li          if(it.row() < j) continue;
*bf2c3715SXin Li          if(it.row() == j)
*bf2c3715SXin Li          {
*bf2c3715SXin Li            det += log(abs(it.value()));
*bf2c3715SXin Li            break;
*bf2c3715SXin Li          }
*bf2c3715SXin Li        }
*bf2c3715SXin Li      }
*bf2c3715SXin Li      return det;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    /** \returns A number representing the sign of the determinant
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \sa absDeterminant(), logAbsDeterminant()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    Scalar signDeterminant()
*bf2c3715SXin Li    {
*bf2c3715SXin Li      eigen_assert(m_factorizationIsOk && "The matrix should be factorized first.");
*bf2c3715SXin Li      // Initialize with the determinant of the row matrix
*bf2c3715SXin Li      Index det = 1;
*bf2c3715SXin Li      // Note that the diagonal blocks of U are stored in supernodes,
*bf2c3715SXin Li      // which are available in the  L part :)
*bf2c3715SXin Li      for (Index j = 0; j < this->cols(); ++j)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        for (typename SCMatrix::InnerIterator it(m_Lstore, j); it; ++it)
*bf2c3715SXin Li        {
*bf2c3715SXin Li          if(it.index() == j)
*bf2c3715SXin Li          {
*bf2c3715SXin Li            if(it.value()<0)
*bf2c3715SXin Li              det = -det;
*bf2c3715SXin Li            else if(it.value()==0)
*bf2c3715SXin Li              return 0;
*bf2c3715SXin Li            break;
*bf2c3715SXin Li          }
*bf2c3715SXin Li        }
*bf2c3715SXin Li      }
*bf2c3715SXin Li      return det * m_detPermR * m_detPermC;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    /** \returns The determinant of the matrix.
*bf2c3715SXin Li      *
*bf2c3715SXin Li      * \sa absDeterminant(), logAbsDeterminant()
*bf2c3715SXin Li      */
*bf2c3715SXin Li    Scalar determinant()
*bf2c3715SXin Li    {
*bf2c3715SXin Li      eigen_assert(m_factorizationIsOk && "The matrix should be factorized first.");
*bf2c3715SXin Li      // Initialize with the determinant of the row matrix
*bf2c3715SXin Li      Scalar det = Scalar(1.);
*bf2c3715SXin Li      // Note that the diagonal blocks of U are stored in supernodes,
*bf2c3715SXin Li      // which are available in the  L part :)
*bf2c3715SXin Li      for (Index j = 0; j < this->cols(); ++j)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        for (typename SCMatrix::InnerIterator it(m_Lstore, j); it; ++it)
*bf2c3715SXin Li        {
*bf2c3715SXin Li          if(it.index() == j)
*bf2c3715SXin Li          {
*bf2c3715SXin Li            det *= it.value();
*bf2c3715SXin Li            break;
*bf2c3715SXin Li          }
*bf2c3715SXin Li        }
*bf2c3715SXin Li      }
*bf2c3715SXin Li      return (m_detPermR * m_detPermC) > 0 ? det : -det;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    Index nnzL() const { return m_nnzL; };
*bf2c3715SXin Li    Index nnzU() const { return m_nnzU; };
*bf2c3715SXin Li
*bf2c3715SXin Li  protected:
*bf2c3715SXin Li    // Functions
*bf2c3715SXin Li    void initperfvalues()
*bf2c3715SXin Li    {
*bf2c3715SXin Li      m_perfv.panel_size = 16;
*bf2c3715SXin Li      m_perfv.relax = 1;
*bf2c3715SXin Li      m_perfv.maxsuper = 128;
*bf2c3715SXin Li      m_perfv.rowblk = 16;
*bf2c3715SXin Li      m_perfv.colblk = 8;
*bf2c3715SXin Li      m_perfv.fillfactor = 20;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li    // Variables
*bf2c3715SXin Li    mutable ComputationInfo m_info;
*bf2c3715SXin Li    bool m_factorizationIsOk;
*bf2c3715SXin Li    bool m_analysisIsOk;
*bf2c3715SXin Li    std::string m_lastError;
*bf2c3715SXin Li    NCMatrix m_mat; // The input (permuted ) matrix
*bf2c3715SXin Li    SCMatrix m_Lstore; // The lower triangular matrix (supernodal)
*bf2c3715SXin Li    MappedSparseMatrix<Scalar,ColMajor,StorageIndex> m_Ustore; // The upper triangular matrix
*bf2c3715SXin Li    PermutationType m_perm_c; // Column permutation
*bf2c3715SXin Li    PermutationType m_perm_r ; // Row permutation
*bf2c3715SXin Li    IndexVector m_etree; // Column elimination tree
*bf2c3715SXin Li
*bf2c3715SXin Li    typename Base::GlobalLU_t m_glu;
*bf2c3715SXin Li
*bf2c3715SXin Li    // SparseLU options
*bf2c3715SXin Li    bool m_symmetricmode;
*bf2c3715SXin Li    // values for performance
*bf2c3715SXin Li    internal::perfvalues m_perfv;
*bf2c3715SXin Li    RealScalar m_diagpivotthresh; // Specifies the threshold used for a diagonal entry to be an acceptable pivot
*bf2c3715SXin Li    Index m_nnzL, m_nnzU; // Nonzeros in L and U factors
*bf2c3715SXin Li    Index m_detPermR, m_detPermC; // Determinants of the permutation matrices
*bf2c3715SXin Li  private:
*bf2c3715SXin Li    // Disable copy constructor
*bf2c3715SXin Li    SparseLU (const SparseLU& );
*bf2c3715SXin Li}; // End class SparseLU
*bf2c3715SXin Li
*bf2c3715SXin Li
*bf2c3715SXin Li
*bf2c3715SXin Li// Functions needed by the anaysis phase
*bf2c3715SXin Li/**
*bf2c3715SXin Li  * Compute the column permutation to minimize the fill-in
*bf2c3715SXin Li  *
*bf2c3715SXin Li  *  - Apply this permutation to the input matrix -
*bf2c3715SXin Li  *
*bf2c3715SXin Li  *  - Compute the column elimination tree on the permuted matrix
*bf2c3715SXin Li  *
*bf2c3715SXin Li  *  - Postorder the elimination tree and the column permutation
*bf2c3715SXin Li  *
*bf2c3715SXin Li  */
*bf2c3715SXin Litemplate <typename MatrixType, typename OrderingType>
*bf2c3715SXin Livoid SparseLU<MatrixType, OrderingType>::analyzePattern(const MatrixType& mat)
*bf2c3715SXin Li{
*bf2c3715SXin Li
*bf2c3715SXin Li  //TODO  It is possible as in SuperLU to compute row and columns scaling vectors to equilibrate the matrix mat.
*bf2c3715SXin Li
*bf2c3715SXin Li  // Firstly, copy the whole input matrix.
*bf2c3715SXin Li  m_mat = mat;
*bf2c3715SXin Li
*bf2c3715SXin Li  // Compute fill-in ordering
*bf2c3715SXin Li  OrderingType ord;
*bf2c3715SXin Li  ord(m_mat,m_perm_c);
*bf2c3715SXin Li
*bf2c3715SXin Li  // Apply the permutation to the column of the input  matrix
*bf2c3715SXin Li  if (m_perm_c.size())
*bf2c3715SXin Li  {
*bf2c3715SXin Li    m_mat.uncompress(); //NOTE: The effect of this command is only to create the InnerNonzeros pointers. FIXME : This vector is filled but not subsequently used.
*bf2c3715SXin Li    // Then, permute only the column pointers
*bf2c3715SXin Li    ei_declare_aligned_stack_constructed_variable(StorageIndex,outerIndexPtr,mat.cols()+1,mat.isCompressed()?const_cast<StorageIndex*>(mat.outerIndexPtr()):0);
*bf2c3715SXin Li
*bf2c3715SXin Li    // If the input matrix 'mat' is uncompressed, then the outer-indices do not match the ones of m_mat, and a copy is thus needed.
*bf2c3715SXin Li    if(!mat.isCompressed())
*bf2c3715SXin Li      IndexVector::Map(outerIndexPtr, mat.cols()+1) = IndexVector::Map(m_mat.outerIndexPtr(),mat.cols()+1);
*bf2c3715SXin Li
*bf2c3715SXin Li    // Apply the permutation and compute the nnz per column.
*bf2c3715SXin Li    for (Index i = 0; i < mat.cols(); i++)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      m_mat.outerIndexPtr()[m_perm_c.indices()(i)] = outerIndexPtr[i];
*bf2c3715SXin Li      m_mat.innerNonZeroPtr()[m_perm_c.indices()(i)] = outerIndexPtr[i+1] - outerIndexPtr[i];
*bf2c3715SXin Li    }
*bf2c3715SXin Li  }
*bf2c3715SXin Li
*bf2c3715SXin Li  // Compute the column elimination tree of the permuted matrix
*bf2c3715SXin Li  IndexVector firstRowElt;
*bf2c3715SXin Li  internal::coletree(m_mat, m_etree,firstRowElt);
*bf2c3715SXin Li
*bf2c3715SXin Li  // In symmetric mode, do not do postorder here
*bf2c3715SXin Li  if (!m_symmetricmode) {
*bf2c3715SXin Li    IndexVector post, iwork;
*bf2c3715SXin Li    // Post order etree
*bf2c3715SXin Li    internal::treePostorder(StorageIndex(m_mat.cols()), m_etree, post);
*bf2c3715SXin Li
*bf2c3715SXin Li
*bf2c3715SXin Li    // Renumber etree in postorder
*bf2c3715SXin Li    Index m = m_mat.cols();
*bf2c3715SXin Li    iwork.resize(m+1);
*bf2c3715SXin Li    for (Index i = 0; i < m; ++i) iwork(post(i)) = post(m_etree(i));
*bf2c3715SXin Li    m_etree = iwork;
*bf2c3715SXin Li
*bf2c3715SXin Li    // Postmultiply A*Pc by post, i.e reorder the matrix according to the postorder of the etree
*bf2c3715SXin Li    PermutationType post_perm(m);
*bf2c3715SXin Li    for (Index i = 0; i < m; i++)
*bf2c3715SXin Li      post_perm.indices()(i) = post(i);
*bf2c3715SXin Li
*bf2c3715SXin Li    // Combine the two permutations : postorder the permutation for future use
*bf2c3715SXin Li    if(m_perm_c.size()) {
*bf2c3715SXin Li      m_perm_c = post_perm * m_perm_c;
*bf2c3715SXin Li    }
*bf2c3715SXin Li
*bf2c3715SXin Li  } // end postordering
*bf2c3715SXin Li
*bf2c3715SXin Li  m_analysisIsOk = true;
*bf2c3715SXin Li}
*bf2c3715SXin Li
*bf2c3715SXin Li// Functions needed by the numerical factorization phase
*bf2c3715SXin Li
*bf2c3715SXin Li
*bf2c3715SXin Li/**
*bf2c3715SXin Li  *  - Numerical factorization
*bf2c3715SXin Li  *  - Interleaved with the symbolic factorization
*bf2c3715SXin Li  * On exit,  info is
*bf2c3715SXin Li  *
*bf2c3715SXin Li  *    = 0: successful factorization
*bf2c3715SXin Li  *
*bf2c3715SXin Li  *    > 0: if info = i, and i is
*bf2c3715SXin Li  *
*bf2c3715SXin Li  *       <= A->ncol: U(i,i) is exactly zero. The factorization has
*bf2c3715SXin Li  *          been completed, but the factor U is exactly singular,
*bf2c3715SXin Li  *          and division by zero will occur if it is used to solve a
*bf2c3715SXin Li  *          system of equations.
*bf2c3715SXin Li  *
*bf2c3715SXin Li  *       > A->ncol: number of bytes allocated when memory allocation
*bf2c3715SXin Li  *         failure occurred, plus A->ncol. If lwork = -1, it is
*bf2c3715SXin Li  *         the estimated amount of space needed, plus A->ncol.
*bf2c3715SXin Li  */
*bf2c3715SXin Litemplate <typename MatrixType, typename OrderingType>
*bf2c3715SXin Livoid SparseLU<MatrixType, OrderingType>::factorize(const MatrixType& matrix)
*bf2c3715SXin Li{
*bf2c3715SXin Li  using internal::emptyIdxLU;
*bf2c3715SXin Li  eigen_assert(m_analysisIsOk && "analyzePattern() should be called first");
*bf2c3715SXin Li  eigen_assert((matrix.rows() == matrix.cols()) && "Only for squared matrices");
*bf2c3715SXin Li
*bf2c3715SXin Li  m_isInitialized = true;
*bf2c3715SXin Li
*bf2c3715SXin Li  // Apply the column permutation computed in analyzepattern()
*bf2c3715SXin Li  //   m_mat = matrix * m_perm_c.inverse();
*bf2c3715SXin Li  m_mat = matrix;
*bf2c3715SXin Li  if (m_perm_c.size())
*bf2c3715SXin Li  {
*bf2c3715SXin Li    m_mat.uncompress(); //NOTE: The effect of this command is only to create the InnerNonzeros pointers.
*bf2c3715SXin Li    //Then, permute only the column pointers
*bf2c3715SXin Li    const StorageIndex * outerIndexPtr;
*bf2c3715SXin Li    if (matrix.isCompressed()) outerIndexPtr = matrix.outerIndexPtr();
*bf2c3715SXin Li    else
*bf2c3715SXin Li    {
*bf2c3715SXin Li      StorageIndex* outerIndexPtr_t = new StorageIndex[matrix.cols()+1];
*bf2c3715SXin Li      for(Index i = 0; i <= matrix.cols(); i++) outerIndexPtr_t[i] = m_mat.outerIndexPtr()[i];
*bf2c3715SXin Li      outerIndexPtr = outerIndexPtr_t;
*bf2c3715SXin Li    }
*bf2c3715SXin Li    for (Index i = 0; i < matrix.cols(); i++)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      m_mat.outerIndexPtr()[m_perm_c.indices()(i)] = outerIndexPtr[i];
*bf2c3715SXin Li      m_mat.innerNonZeroPtr()[m_perm_c.indices()(i)] = outerIndexPtr[i+1] - outerIndexPtr[i];
*bf2c3715SXin Li    }
*bf2c3715SXin Li    if(!matrix.isCompressed()) delete[] outerIndexPtr;
*bf2c3715SXin Li  }
*bf2c3715SXin Li  else
*bf2c3715SXin Li  { //FIXME This should not be needed if the empty permutation is handled transparently
*bf2c3715SXin Li    m_perm_c.resize(matrix.cols());
*bf2c3715SXin Li    for(StorageIndex i = 0; i < matrix.cols(); ++i) m_perm_c.indices()(i) = i;
*bf2c3715SXin Li  }
*bf2c3715SXin Li
*bf2c3715SXin Li  Index m = m_mat.rows();
*bf2c3715SXin Li  Index n = m_mat.cols();
*bf2c3715SXin Li  Index nnz = m_mat.nonZeros();
*bf2c3715SXin Li  Index maxpanel = m_perfv.panel_size * m;
*bf2c3715SXin Li  // Allocate working storage common to the factor routines
*bf2c3715SXin Li  Index lwork = 0;
*bf2c3715SXin Li  Index info = Base::memInit(m, n, nnz, lwork, m_perfv.fillfactor, m_perfv.panel_size, m_glu);
*bf2c3715SXin Li  if (info)
*bf2c3715SXin Li  {
*bf2c3715SXin Li    m_lastError = "UNABLE TO ALLOCATE WORKING MEMORY\n\n" ;
*bf2c3715SXin Li    m_factorizationIsOk = false;
*bf2c3715SXin Li    return ;
*bf2c3715SXin Li  }
*bf2c3715SXin Li
*bf2c3715SXin Li  // Set up pointers for integer working arrays
*bf2c3715SXin Li  IndexVector segrep(m); segrep.setZero();
*bf2c3715SXin Li  IndexVector parent(m); parent.setZero();
*bf2c3715SXin Li  IndexVector xplore(m); xplore.setZero();
*bf2c3715SXin Li  IndexVector repfnz(maxpanel);
*bf2c3715SXin Li  IndexVector panel_lsub(maxpanel);
*bf2c3715SXin Li  IndexVector xprune(n); xprune.setZero();
*bf2c3715SXin Li  IndexVector marker(m*internal::LUNoMarker); marker.setZero();
*bf2c3715SXin Li
*bf2c3715SXin Li  repfnz.setConstant(-1);
*bf2c3715SXin Li  panel_lsub.setConstant(-1);
*bf2c3715SXin Li
*bf2c3715SXin Li  // Set up pointers for scalar working arrays
*bf2c3715SXin Li  ScalarVector dense;
*bf2c3715SXin Li  dense.setZero(maxpanel);
*bf2c3715SXin Li  ScalarVector tempv;
*bf2c3715SXin Li  tempv.setZero(internal::LUnumTempV(m, m_perfv.panel_size, m_perfv.maxsuper, /*m_perfv.rowblk*/m) );
*bf2c3715SXin Li
*bf2c3715SXin Li  // Compute the inverse of perm_c
*bf2c3715SXin Li  PermutationType iperm_c(m_perm_c.inverse());
*bf2c3715SXin Li
*bf2c3715SXin Li  // Identify initial relaxed snodes
*bf2c3715SXin Li  IndexVector relax_end(n);
*bf2c3715SXin Li  if ( m_symmetricmode == true )
*bf2c3715SXin Li    Base::heap_relax_snode(n, m_etree, m_perfv.relax, marker, relax_end);
*bf2c3715SXin Li  else
*bf2c3715SXin Li    Base::relax_snode(n, m_etree, m_perfv.relax, marker, relax_end);
*bf2c3715SXin Li
*bf2c3715SXin Li
*bf2c3715SXin Li  m_perm_r.resize(m);
*bf2c3715SXin Li  m_perm_r.indices().setConstant(-1);
*bf2c3715SXin Li  marker.setConstant(-1);
*bf2c3715SXin Li  m_detPermR = 1; // Record the determinant of the row permutation
*bf2c3715SXin Li
*bf2c3715SXin Li  m_glu.supno(0) = emptyIdxLU; m_glu.xsup.setConstant(0);
*bf2c3715SXin Li  m_glu.xsup(0) = m_glu.xlsub(0) = m_glu.xusub(0) = m_glu.xlusup(0) = Index(0);
*bf2c3715SXin Li
*bf2c3715SXin Li  // Work on one 'panel' at a time. A panel is one of the following :
*bf2c3715SXin Li  //  (a) a relaxed supernode at the bottom of the etree, or
*bf2c3715SXin Li  //  (b) panel_size contiguous columns, <panel_size> defined by the user
*bf2c3715SXin Li  Index jcol;
*bf2c3715SXin Li  Index pivrow; // Pivotal row number in the original row matrix
*bf2c3715SXin Li  Index nseg1; // Number of segments in U-column above panel row jcol
*bf2c3715SXin Li  Index nseg; // Number of segments in each U-column
*bf2c3715SXin Li  Index irep;
*bf2c3715SXin Li  Index i, k, jj;
*bf2c3715SXin Li  for (jcol = 0; jcol < n; )
*bf2c3715SXin Li  {
*bf2c3715SXin Li    // Adjust panel size so that a panel won't overlap with the next relaxed snode.
*bf2c3715SXin Li    Index panel_size = m_perfv.panel_size; // upper bound on panel width
*bf2c3715SXin Li    for (k = jcol + 1; k < (std::min)(jcol+panel_size, n); k++)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      if (relax_end(k) != emptyIdxLU)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        panel_size = k - jcol;
*bf2c3715SXin Li        break;
*bf2c3715SXin Li      }
*bf2c3715SXin Li    }
*bf2c3715SXin Li    if (k == n)
*bf2c3715SXin Li      panel_size = n - jcol;
*bf2c3715SXin Li
*bf2c3715SXin Li    // Symbolic outer factorization on a panel of columns
*bf2c3715SXin Li    Base::panel_dfs(m, panel_size, jcol, m_mat, m_perm_r.indices(), nseg1, dense, panel_lsub, segrep, repfnz, xprune, marker, parent, xplore, m_glu);
*bf2c3715SXin Li
*bf2c3715SXin Li    // Numeric sup-panel updates in topological order
*bf2c3715SXin Li    Base::panel_bmod(m, panel_size, jcol, nseg1, dense, tempv, segrep, repfnz, m_glu);
*bf2c3715SXin Li
*bf2c3715SXin Li    // Sparse LU within the panel, and below the panel diagonal
*bf2c3715SXin Li    for ( jj = jcol; jj< jcol + panel_size; jj++)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      k = (jj - jcol) * m; // Column index for w-wide arrays
*bf2c3715SXin Li
*bf2c3715SXin Li      nseg = nseg1; // begin after all the panel segments
*bf2c3715SXin Li      //Depth-first-search for the current column
*bf2c3715SXin Li      VectorBlock<IndexVector> panel_lsubk(panel_lsub, k, m);
*bf2c3715SXin Li      VectorBlock<IndexVector> repfnz_k(repfnz, k, m);
*bf2c3715SXin Li      info = Base::column_dfs(m, jj, m_perm_r.indices(), m_perfv.maxsuper, nseg, panel_lsubk, segrep, repfnz_k, xprune, marker, parent, xplore, m_glu);
*bf2c3715SXin Li      if ( info )
*bf2c3715SXin Li      {
*bf2c3715SXin Li        m_lastError =  "UNABLE TO EXPAND MEMORY IN COLUMN_DFS() ";
*bf2c3715SXin Li        m_info = NumericalIssue;
*bf2c3715SXin Li        m_factorizationIsOk = false;
*bf2c3715SXin Li        return;
*bf2c3715SXin Li      }
*bf2c3715SXin Li      // Numeric updates to this column
*bf2c3715SXin Li      VectorBlock<ScalarVector> dense_k(dense, k, m);
*bf2c3715SXin Li      VectorBlock<IndexVector> segrep_k(segrep, nseg1, m-nseg1);
*bf2c3715SXin Li      info = Base::column_bmod(jj, (nseg - nseg1), dense_k, tempv, segrep_k, repfnz_k, jcol, m_glu);
*bf2c3715SXin Li      if ( info )
*bf2c3715SXin Li      {
*bf2c3715SXin Li        m_lastError = "UNABLE TO EXPAND MEMORY IN COLUMN_BMOD() ";
*bf2c3715SXin Li        m_info = NumericalIssue;
*bf2c3715SXin Li        m_factorizationIsOk = false;
*bf2c3715SXin Li        return;
*bf2c3715SXin Li      }
*bf2c3715SXin Li
*bf2c3715SXin Li      // Copy the U-segments to ucol(*)
*bf2c3715SXin Li      info = Base::copy_to_ucol(jj, nseg, segrep, repfnz_k ,m_perm_r.indices(), dense_k, m_glu);
*bf2c3715SXin Li      if ( info )
*bf2c3715SXin Li      {
*bf2c3715SXin Li        m_lastError = "UNABLE TO EXPAND MEMORY IN COPY_TO_UCOL() ";
*bf2c3715SXin Li        m_info = NumericalIssue;
*bf2c3715SXin Li        m_factorizationIsOk = false;
*bf2c3715SXin Li        return;
*bf2c3715SXin Li      }
*bf2c3715SXin Li
*bf2c3715SXin Li      // Form the L-segment
*bf2c3715SXin Li      info = Base::pivotL(jj, m_diagpivotthresh, m_perm_r.indices(), iperm_c.indices(), pivrow, m_glu);
*bf2c3715SXin Li      if ( info )
*bf2c3715SXin Li      {
*bf2c3715SXin Li        m_lastError = "THE MATRIX IS STRUCTURALLY SINGULAR ... ZERO COLUMN AT ";
*bf2c3715SXin Li        std::ostringstream returnInfo;
*bf2c3715SXin Li        returnInfo << info;
*bf2c3715SXin Li        m_lastError += returnInfo.str();
*bf2c3715SXin Li        m_info = NumericalIssue;
*bf2c3715SXin Li        m_factorizationIsOk = false;
*bf2c3715SXin Li        return;
*bf2c3715SXin Li      }
*bf2c3715SXin Li
*bf2c3715SXin Li      // Update the determinant of the row permutation matrix
*bf2c3715SXin Li      // FIXME: the following test is not correct, we should probably take iperm_c into account and pivrow is not directly the row pivot.
*bf2c3715SXin Li      if (pivrow != jj) m_detPermR = -m_detPermR;
*bf2c3715SXin Li
*bf2c3715SXin Li      // Prune columns (0:jj-1) using column jj
*bf2c3715SXin Li      Base::pruneL(jj, m_perm_r.indices(), pivrow, nseg, segrep, repfnz_k, xprune, m_glu);
*bf2c3715SXin Li
*bf2c3715SXin Li      // Reset repfnz for this column
*bf2c3715SXin Li      for (i = 0; i < nseg; i++)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        irep = segrep(i);
*bf2c3715SXin Li        repfnz_k(irep) = emptyIdxLU;
*bf2c3715SXin Li      }
*bf2c3715SXin Li    } // end SparseLU within the panel
*bf2c3715SXin Li    jcol += panel_size;  // Move to the next panel
*bf2c3715SXin Li  } // end for -- end elimination
*bf2c3715SXin Li
*bf2c3715SXin Li  m_detPermR = m_perm_r.determinant();
*bf2c3715SXin Li  m_detPermC = m_perm_c.determinant();
*bf2c3715SXin Li
*bf2c3715SXin Li  // Count the number of nonzeros in factors
*bf2c3715SXin Li  Base::countnz(n, m_nnzL, m_nnzU, m_glu);
*bf2c3715SXin Li  // Apply permutation  to the L subscripts
*bf2c3715SXin Li  Base::fixupL(n, m_perm_r.indices(), m_glu);
*bf2c3715SXin Li
*bf2c3715SXin Li  // Create supernode matrix L
*bf2c3715SXin Li  m_Lstore.setInfos(m, n, m_glu.lusup, m_glu.xlusup, m_glu.lsub, m_glu.xlsub, m_glu.supno, m_glu.xsup);
*bf2c3715SXin Li  // Create the column major upper sparse matrix  U;
*bf2c3715SXin Li  new (&m_Ustore) MappedSparseMatrix<Scalar, ColMajor, StorageIndex> ( m, n, m_nnzU, m_glu.xusub.data(), m_glu.usub.data(), m_glu.ucol.data() );
*bf2c3715SXin Li
*bf2c3715SXin Li  m_info = Success;
*bf2c3715SXin Li  m_factorizationIsOk = true;
*bf2c3715SXin Li}
*bf2c3715SXin Li
*bf2c3715SXin Litemplate<typename MappedSupernodalType>
*bf2c3715SXin Listruct SparseLUMatrixLReturnType : internal::no_assignment_operator
*bf2c3715SXin Li{
*bf2c3715SXin Li  typedef typename MappedSupernodalType::Scalar Scalar;
*bf2c3715SXin Li  explicit SparseLUMatrixLReturnType(const MappedSupernodalType& mapL) : m_mapL(mapL)
*bf2c3715SXin Li  { }
*bf2c3715SXin Li  Index rows() const { return m_mapL.rows(); }
*bf2c3715SXin Li  Index cols() const { return m_mapL.cols(); }
*bf2c3715SXin Li  template<typename Dest>
*bf2c3715SXin Li  void solveInPlace( MatrixBase<Dest> &X) const
*bf2c3715SXin Li  {
*bf2c3715SXin Li    m_mapL.solveInPlace(X);
*bf2c3715SXin Li  }
*bf2c3715SXin Li  template<bool Conjugate, typename Dest>
*bf2c3715SXin Li  void solveTransposedInPlace( MatrixBase<Dest> &X) const
*bf2c3715SXin Li  {
*bf2c3715SXin Li    m_mapL.template solveTransposedInPlace<Conjugate>(X);
*bf2c3715SXin Li  }
*bf2c3715SXin Li
*bf2c3715SXin Li  const MappedSupernodalType& m_mapL;
*bf2c3715SXin Li};
*bf2c3715SXin Li
*bf2c3715SXin Litemplate<typename MatrixLType, typename MatrixUType>
*bf2c3715SXin Listruct SparseLUMatrixUReturnType : internal::no_assignment_operator
*bf2c3715SXin Li{
*bf2c3715SXin Li  typedef typename MatrixLType::Scalar Scalar;
*bf2c3715SXin Li  SparseLUMatrixUReturnType(const MatrixLType& mapL, const MatrixUType& mapU)
*bf2c3715SXin Li  : m_mapL(mapL),m_mapU(mapU)
*bf2c3715SXin Li  { }
*bf2c3715SXin Li  Index rows() const { return m_mapL.rows(); }
*bf2c3715SXin Li  Index cols() const { return m_mapL.cols(); }
*bf2c3715SXin Li
*bf2c3715SXin Li  template<typename Dest>   void solveInPlace(MatrixBase<Dest> &X) const
*bf2c3715SXin Li  {
*bf2c3715SXin Li    Index nrhs = X.cols();
*bf2c3715SXin Li    Index n    = X.rows();
*bf2c3715SXin Li    // Backward solve with U
*bf2c3715SXin Li    for (Index k = m_mapL.nsuper(); k >= 0; k--)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      Index fsupc = m_mapL.supToCol()[k];
*bf2c3715SXin Li      Index lda = m_mapL.colIndexPtr()[fsupc+1] - m_mapL.colIndexPtr()[fsupc]; // leading dimension
*bf2c3715SXin Li      Index nsupc = m_mapL.supToCol()[k+1] - fsupc;
*bf2c3715SXin Li      Index luptr = m_mapL.colIndexPtr()[fsupc];
*bf2c3715SXin Li
*bf2c3715SXin Li      if (nsupc == 1)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        for (Index j = 0; j < nrhs; j++)
*bf2c3715SXin Li        {
*bf2c3715SXin Li          X(fsupc, j) /= m_mapL.valuePtr()[luptr];
*bf2c3715SXin Li        }
*bf2c3715SXin Li      }
*bf2c3715SXin Li      else
*bf2c3715SXin Li      {
*bf2c3715SXin Li        // FIXME: the following lines should use Block expressions and not Map!
*bf2c3715SXin Li        Map<const Matrix<Scalar,Dynamic,Dynamic, ColMajor>, 0, OuterStride<> > A( &(m_mapL.valuePtr()[luptr]), nsupc, nsupc, OuterStride<>(lda) );
*bf2c3715SXin Li        Map< Matrix<Scalar,Dynamic,Dest::ColsAtCompileTime, ColMajor>, 0, OuterStride<> > U (&(X.coeffRef(fsupc,0)), nsupc, nrhs, OuterStride<>(n) );
*bf2c3715SXin Li        U = A.template triangularView<Upper>().solve(U);
*bf2c3715SXin Li      }
*bf2c3715SXin Li
*bf2c3715SXin Li      for (Index j = 0; j < nrhs; ++j)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        for (Index jcol = fsupc; jcol < fsupc + nsupc; jcol++)
*bf2c3715SXin Li        {
*bf2c3715SXin Li          typename MatrixUType::InnerIterator it(m_mapU, jcol);
*bf2c3715SXin Li          for ( ; it; ++it)
*bf2c3715SXin Li          {
*bf2c3715SXin Li            Index irow = it.index();
*bf2c3715SXin Li            X(irow, j) -= X(jcol, j) * it.value();
*bf2c3715SXin Li          }
*bf2c3715SXin Li        }
*bf2c3715SXin Li      }
*bf2c3715SXin Li    } // End For U-solve
*bf2c3715SXin Li  }
*bf2c3715SXin Li
*bf2c3715SXin Li  template<bool Conjugate, typename Dest>   void solveTransposedInPlace(MatrixBase<Dest> &X) const
*bf2c3715SXin Li  {
*bf2c3715SXin Li    using numext::conj;
*bf2c3715SXin Li    Index nrhs = X.cols();
*bf2c3715SXin Li    Index n    = X.rows();
*bf2c3715SXin Li    // Forward solve with U
*bf2c3715SXin Li    for (Index k = 0; k <=  m_mapL.nsuper(); k++)
*bf2c3715SXin Li    {
*bf2c3715SXin Li      Index fsupc = m_mapL.supToCol()[k];
*bf2c3715SXin Li      Index lda = m_mapL.colIndexPtr()[fsupc+1] - m_mapL.colIndexPtr()[fsupc]; // leading dimension
*bf2c3715SXin Li      Index nsupc = m_mapL.supToCol()[k+1] - fsupc;
*bf2c3715SXin Li      Index luptr = m_mapL.colIndexPtr()[fsupc];
*bf2c3715SXin Li
*bf2c3715SXin Li      for (Index j = 0; j < nrhs; ++j)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        for (Index jcol = fsupc; jcol < fsupc + nsupc; jcol++)
*bf2c3715SXin Li        {
*bf2c3715SXin Li          typename MatrixUType::InnerIterator it(m_mapU, jcol);
*bf2c3715SXin Li          for ( ; it; ++it)
*bf2c3715SXin Li          {
*bf2c3715SXin Li            Index irow = it.index();
*bf2c3715SXin Li            X(jcol, j) -= X(irow, j) * (Conjugate? conj(it.value()): it.value());
*bf2c3715SXin Li          }
*bf2c3715SXin Li        }
*bf2c3715SXin Li      }
*bf2c3715SXin Li      if (nsupc == 1)
*bf2c3715SXin Li      {
*bf2c3715SXin Li        for (Index j = 0; j < nrhs; j++)
*bf2c3715SXin Li        {
*bf2c3715SXin Li          X(fsupc, j) /= (Conjugate? conj(m_mapL.valuePtr()[luptr]) : m_mapL.valuePtr()[luptr]);
*bf2c3715SXin Li        }
*bf2c3715SXin Li      }
*bf2c3715SXin Li      else
*bf2c3715SXin Li      {
*bf2c3715SXin Li        Map<const Matrix<Scalar,Dynamic,Dynamic, ColMajor>, 0, OuterStride<> > A( &(m_mapL.valuePtr()[luptr]), nsupc, nsupc, OuterStride<>(lda) );
*bf2c3715SXin Li        Map< Matrix<Scalar,Dynamic,Dest::ColsAtCompileTime, ColMajor>, 0, OuterStride<> > U (&(X(fsupc,0)), nsupc, nrhs, OuterStride<>(n) );
*bf2c3715SXin Li        if(Conjugate)
*bf2c3715SXin Li          U = A.adjoint().template triangularView<Lower>().solve(U);
*bf2c3715SXin Li        else
*bf2c3715SXin Li          U = A.transpose().template triangularView<Lower>().solve(U);
*bf2c3715SXin Li      }
*bf2c3715SXin Li    }// End For U-solve
*bf2c3715SXin Li  }
*bf2c3715SXin Li
*bf2c3715SXin Li
*bf2c3715SXin Li  const MatrixLType& m_mapL;
*bf2c3715SXin Li  const MatrixUType& m_mapU;
*bf2c3715SXin Li};
*bf2c3715SXin Li
*bf2c3715SXin Li} // End namespace Eigen
*bf2c3715SXin Li
*bf2c3715SXin Li#endif