| // This file is part of Eigen, a lightweight C++ template library | 
 | // for linear algebra. | 
 | // | 
 | // Copyright (C) 2008-2009 Gael Guennebaud <g.gael@free.fr> | 
 | // | 
 | // Eigen is free software; you can redistribute it and/or | 
 | // modify it under the terms of the GNU Lesser General Public | 
 | // License as published by the Free Software Foundation; either | 
 | // version 3 of the License, or (at your option) any later version. | 
 | // | 
 | // Alternatively, you can redistribute it and/or | 
 | // modify it under the terms of the GNU General Public License as | 
 | // published by the Free Software Foundation; either version 2 of | 
 | // the License, or (at your option) any later version. | 
 | // | 
 | // Eigen is distributed in the hope that it will be useful, but WITHOUT ANY | 
 | // WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS | 
 | // FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License or the | 
 | // GNU General Public License for more details. | 
 | // | 
 | // You should have received a copy of the GNU Lesser General Public | 
 | // License and a copy of the GNU General Public License along with | 
 | // Eigen. If not, see <http://www.gnu.org/licenses/>. | 
 |  | 
 | #ifndef EIGEN_SOLVETRIANGULAR_H | 
 | #define EIGEN_SOLVETRIANGULAR_H | 
 |  | 
 | template<typename Lhs, typename Rhs, int Side> | 
 | class ei_trsolve_traits | 
 | { | 
 |   private: | 
 |     enum { | 
 |       RhsIsVectorAtCompileTime = (Side==OnTheLeft ? Rhs::ColsAtCompileTime : Rhs::RowsAtCompileTime)==1 | 
 |     }; | 
 |   public: | 
 |     enum { | 
 |       Unrolling   = (RhsIsVectorAtCompileTime && Rhs::SizeAtCompileTime != Dynamic && Rhs::SizeAtCompileTime <= 8) | 
 |                   ? CompleteUnrolling : NoUnrolling, | 
 |       RhsVectors  = RhsIsVectorAtCompileTime ? 1 : Dynamic | 
 |     }; | 
 | }; | 
 |  | 
 | template<typename Lhs, typename Rhs, | 
 |   int Side, // can be OnTheLeft/OnTheRight | 
 |   int Mode, // can be Upper/Lower | UnitDiag | 
 |   int Unrolling = ei_trsolve_traits<Lhs,Rhs,Side>::Unrolling, | 
 |   int StorageOrder = (int(Lhs::Flags) & RowMajorBit) ? RowMajor : ColMajor, | 
 |   int RhsVectors = ei_trsolve_traits<Lhs,Rhs,Side>::RhsVectors | 
 |   > | 
 | struct ei_triangular_solver_selector; | 
 |  | 
 | // forward and backward substitution, row-major, rhs is a vector | 
 | template<typename Lhs, typename Rhs, int Mode> | 
 | struct ei_triangular_solver_selector<Lhs,Rhs,OnTheLeft,Mode,NoUnrolling,RowMajor,1> | 
 | { | 
 |   typedef typename Rhs::Scalar Scalar; | 
 |   typedef ei_blas_traits<Lhs> LhsProductTraits; | 
 |   typedef typename LhsProductTraits::ExtractType ActualLhsType; | 
 |   typedef typename Lhs::Index Index; | 
 |   enum { | 
 |     IsLower = ((Mode&Lower)==Lower) | 
 |   }; | 
 |   static void run(const Lhs& lhs, Rhs& other) | 
 |   { | 
 |     static const Index PanelWidth = EIGEN_TUNE_TRIANGULAR_PANEL_WIDTH; | 
 |     ActualLhsType actualLhs = LhsProductTraits::extract(lhs); | 
 |  | 
 |     const Index size = lhs.cols(); | 
 |     for(Index pi=IsLower ? 0 : size; | 
 |         IsLower ? pi<size : pi>0; | 
 |         IsLower ? pi+=PanelWidth : pi-=PanelWidth) | 
 |     { | 
 |       Index actualPanelWidth = std::min(IsLower ? size - pi : pi, PanelWidth); | 
 |  | 
 |       Index r = IsLower ? pi : size - pi; // remaining size | 
 |       if (r > 0) | 
 |       { | 
 |         // let's directly call the low level product function because: | 
 |         // 1 - it is faster to compile | 
 |         // 2 - it is slighlty faster at runtime | 
 |         Index startRow = IsLower ? pi : pi-actualPanelWidth; | 
 |         Index startCol = IsLower ? 0 : pi; | 
 |         VectorBlock<Rhs,Dynamic> target(other,startRow,actualPanelWidth); | 
 |  | 
 |         ei_cache_friendly_product_rowmajor_times_vector<LhsProductTraits::NeedToConjugate,false>( | 
 |           &(actualLhs.const_cast_derived().coeffRef(startRow,startCol)), actualLhs.outerStride(), | 
 |           &(other.coeffRef(startCol)), r, | 
 |           target, Scalar(-1)); | 
 |       } | 
 |  | 
 |       for(Index k=0; k<actualPanelWidth; ++k) | 
 |       { | 
 |         Index i = IsLower ? pi+k : pi-k-1; | 
 |         Index s = IsLower ? pi : i+1; | 
 |         if (k>0) | 
 |           other.coeffRef(i) -= (lhs.row(i).segment(s,k).transpose().cwiseProduct(other.segment(s,k))).sum(); | 
 |  | 
 |         if(!(Mode & UnitDiag)) | 
 |           other.coeffRef(i) /= lhs.coeff(i,i); | 
 |       } | 
 |     } | 
 |   } | 
 | }; | 
 |  | 
 | // forward and backward substitution, column-major, rhs is a vector | 
 | template<typename Lhs, typename Rhs, int Mode> | 
 | struct ei_triangular_solver_selector<Lhs,Rhs,OnTheLeft,Mode,NoUnrolling,ColMajor,1> | 
 | { | 
 |   typedef typename Rhs::Scalar Scalar; | 
 |   typedef typename ei_packet_traits<Scalar>::type Packet; | 
 |   typedef ei_blas_traits<Lhs> LhsProductTraits; | 
 |   typedef typename LhsProductTraits::ExtractType ActualLhsType; | 
 |   typedef typename Lhs::Index Index; | 
 |   enum { | 
 |     PacketSize =  ei_packet_traits<Scalar>::size, | 
 |     IsLower = ((Mode&Lower)==Lower) | 
 |   }; | 
 |  | 
 |   static void run(const Lhs& lhs, Rhs& other) | 
 |   { | 
 |     static const Index PanelWidth = EIGEN_TUNE_TRIANGULAR_PANEL_WIDTH; | 
 |     ActualLhsType actualLhs = LhsProductTraits::extract(lhs); | 
 |  | 
 |     const Index size = lhs.cols(); | 
 |     for(Index pi=IsLower ? 0 : size; | 
 |         IsLower ? pi<size : pi>0; | 
 |         IsLower ? pi+=PanelWidth : pi-=PanelWidth) | 
 |     { | 
 |       Index actualPanelWidth = std::min(IsLower ? size - pi : pi, PanelWidth); | 
 |       Index startBlock = IsLower ? pi : pi-actualPanelWidth; | 
 |       Index endBlock = IsLower ? pi + actualPanelWidth : 0; | 
 |  | 
 |       for(Index k=0; k<actualPanelWidth; ++k) | 
 |       { | 
 |         Index i = IsLower ? pi+k : pi-k-1; | 
 |         if(!(Mode & UnitDiag)) | 
 |           other.coeffRef(i) /= lhs.coeff(i,i); | 
 |  | 
 |         Index r = actualPanelWidth - k - 1; // remaining size | 
 |         Index s = IsLower ? i+1 : i-r; | 
 |         if (r>0) | 
 |           other.segment(s,r) -= other.coeffRef(i) * Block<Lhs,Dynamic,1>(lhs, s, i, r, 1); | 
 |       } | 
 |       Index r = IsLower ? size - endBlock : startBlock; // remaining size | 
 |       if (r > 0) | 
 |       { | 
 |         // let's directly call the low level product function because: | 
 |         // 1 - it is faster to compile | 
 |         // 2 - it is slighlty faster at runtime | 
 |         ei_cache_friendly_product_colmajor_times_vector<LhsProductTraits::NeedToConjugate,false>( | 
 |           r, | 
 |           &(actualLhs.const_cast_derived().coeffRef(endBlock,startBlock)), actualLhs.outerStride(), | 
 |           other.segment(startBlock, actualPanelWidth), | 
 |           &(other.coeffRef(endBlock, 0)), | 
 |           Scalar(-1)); | 
 |       } | 
 |     } | 
 |   } | 
 | }; | 
 |  | 
 | // transpose OnTheRight cases for vectors | 
 | template<typename Lhs, typename Rhs, int Mode, int Unrolling, int StorageOrder> | 
 | struct ei_triangular_solver_selector<Lhs,Rhs,OnTheRight,Mode,Unrolling,StorageOrder,1> | 
 | { | 
 |   static void run(const Lhs& lhs, Rhs& rhs) | 
 |   { | 
 |     Transpose<Rhs> rhsTr(rhs); | 
 |     Transpose<Lhs> lhsTr(lhs); | 
 |     ei_triangular_solver_selector<Transpose<Lhs>,Transpose<Rhs>,OnTheLeft,TriangularView<Lhs,Mode>::TransposeMode>::run(lhsTr,rhsTr); | 
 |   } | 
 | }; | 
 |  | 
 | template <typename Scalar, typename Index, int Side, int Mode, bool Conjugate, int TriStorageOrder, int OtherStorageOrder> | 
 | struct ei_triangular_solve_matrix; | 
 |  | 
 | // the rhs is a matrix | 
 | template<typename Lhs, typename Rhs, int Side, int Mode, int StorageOrder> | 
 | struct ei_triangular_solver_selector<Lhs,Rhs,Side,Mode,NoUnrolling,StorageOrder,Dynamic> | 
 | { | 
 |   typedef typename Rhs::Scalar Scalar; | 
 |   typedef typename Rhs::Index Index; | 
 |   typedef ei_blas_traits<Lhs> LhsProductTraits; | 
 |   typedef typename LhsProductTraits::DirectLinearAccessType ActualLhsType; | 
 |   static void run(const Lhs& lhs, Rhs& rhs) | 
 |   { | 
 |     const ActualLhsType actualLhs = LhsProductTraits::extract(lhs); | 
 |     ei_triangular_solve_matrix<Scalar,Index,Side,Mode,LhsProductTraits::NeedToConjugate,StorageOrder, | 
 |                                (Rhs::Flags&RowMajorBit) ? RowMajor : ColMajor> | 
 |       ::run(lhs.rows(), Side==OnTheLeft? rhs.cols() : rhs.rows(), &actualLhs.coeff(0,0), actualLhs.outerStride(), &rhs.coeffRef(0,0), rhs.outerStride()); | 
 |   } | 
 | }; | 
 |  | 
 | /*************************************************************************** | 
 | * meta-unrolling implementation | 
 | ***************************************************************************/ | 
 |  | 
 | template<typename Lhs, typename Rhs, int Mode, int Index, int Size, | 
 |          bool Stop = Index==Size> | 
 | struct ei_triangular_solver_unroller; | 
 |  | 
 | template<typename Lhs, typename Rhs, int Mode, int Index, int Size> | 
 | struct ei_triangular_solver_unroller<Lhs,Rhs,Mode,Index,Size,false> { | 
 |   enum { | 
 |     IsLower = ((Mode&Lower)==Lower), | 
 |     I = IsLower ? Index : Size - Index - 1, | 
 |     S = IsLower ? 0     : I+1 | 
 |   }; | 
 |   static void run(const Lhs& lhs, Rhs& rhs) | 
 |   { | 
 |     if (Index>0) | 
 |       rhs.coeffRef(I) -= lhs.row(I).template segment<Index>(S).transpose().cwiseProduct(rhs.template segment<Index>(S)).sum(); | 
 |  | 
 |     if(!(Mode & UnitDiag)) | 
 |       rhs.coeffRef(I) /= lhs.coeff(I,I); | 
 |  | 
 |     ei_triangular_solver_unroller<Lhs,Rhs,Mode,Index+1,Size>::run(lhs,rhs); | 
 |   } | 
 | }; | 
 |  | 
 | template<typename Lhs, typename Rhs, int Mode, int Index, int Size> | 
 | struct ei_triangular_solver_unroller<Lhs,Rhs,Mode,Index,Size,true> { | 
 |   static void run(const Lhs&, Rhs&) {} | 
 | }; | 
 |  | 
 | template<typename Lhs, typename Rhs, int Mode, int StorageOrder> | 
 | struct ei_triangular_solver_selector<Lhs,Rhs,OnTheLeft,Mode,CompleteUnrolling,StorageOrder,1> { | 
 |   static void run(const Lhs& lhs, Rhs& rhs) | 
 |   { ei_triangular_solver_unroller<Lhs,Rhs,Mode,0,Rhs::SizeAtCompileTime>::run(lhs,rhs); } | 
 | }; | 
 |  | 
 | /*************************************************************************** | 
 | * TriangularView methods | 
 | ***************************************************************************/ | 
 |  | 
 | /** "in-place" version of TriangularView::solve() where the result is written in \a other | 
 |   * | 
 |   * \nonstableyet | 
 |   * | 
 |   * \warning The parameter is only marked 'const' to make the C++ compiler accept a temporary expression here. | 
 |   * This function will const_cast it, so constness isn't honored here. | 
 |   * | 
 |   * See TriangularView:solve() for the details. | 
 |   */ | 
 | template<typename MatrixType, unsigned int Mode> | 
 | template<int Side, typename OtherDerived> | 
 | void TriangularView<MatrixType,Mode>::solveInPlace(const MatrixBase<OtherDerived>& _other) const | 
 | { | 
 |   OtherDerived& other = _other.const_cast_derived(); | 
 |   ei_assert(cols() == rows()); | 
 |   ei_assert( (Side==OnTheLeft && cols() == other.rows()) || (Side==OnTheRight && cols() == other.cols()) ); | 
 |   ei_assert(!(Mode & ZeroDiag)); | 
 |   ei_assert(Mode & (Upper|Lower)); | 
 |  | 
 |   enum { copy = ei_traits<OtherDerived>::Flags & RowMajorBit  && OtherDerived::IsVectorAtCompileTime }; | 
 |   typedef typename ei_meta_if<copy, | 
 |     typename ei_plain_matrix_type_column_major<OtherDerived>::type, OtherDerived&>::ret OtherCopy; | 
 |   OtherCopy otherCopy(other); | 
 |  | 
 |   ei_triangular_solver_selector<MatrixType, typename ei_unref<OtherCopy>::type, | 
 |     Side, Mode>::run(nestedExpression(), otherCopy); | 
 |  | 
 |   if (copy) | 
 |     other = otherCopy; | 
 | } | 
 |  | 
 | /** \returns the product of the inverse of \c *this with \a other, \a *this being triangular. | 
 |   * | 
 |   * \nonstableyet | 
 |   * | 
 |   * This function computes the inverse-matrix matrix product inverse(\c *this) * \a other. | 
 |   * The matrix \c *this must be triangular and invertible (i.e., all the coefficients of the | 
 |   * diagonal must be non zero). It works as a forward (resp. backward) substitution if \c *this | 
 |   * is an upper (resp. lower) triangular matrix. | 
 |   * | 
 |   * It is required that \c *this be marked as either an upper or a lower triangular matrix, which | 
 |   * can be done by marked(), and that is automatically the case with expressions such as those returned | 
 |   * by extract(). | 
 |   * | 
 |   * Example: \include MatrixBase_marked.cpp | 
 |   * Output: \verbinclude MatrixBase_marked.out | 
 |   * | 
 |   * This function is essentially a wrapper to the faster solveTriangularInPlace() function creating | 
 |   * a temporary copy of \a other, calling solveTriangularInPlace() on the copy and returning it. | 
 |   * Therefore, if \a other is not needed anymore, it is quite faster to call solveTriangularInPlace() | 
 |   * instead of solveTriangular(). | 
 |   * | 
 |   * For users coming from BLAS, this function (and more specifically solveTriangularInPlace()) offer | 
 |   * all the operations supported by the \c *TRSV and \c *TRSM BLAS routines. | 
 |   * | 
 |   * \b Tips: to perform a \em "right-inverse-multiply" you can simply transpose the operation, e.g.: | 
 |   * \code | 
 |   * M * T^1  <=>  T.transpose().solveInPlace(M.transpose()); | 
 |   * \endcode | 
 |   * | 
 |   * \sa TriangularView::solveInPlace() | 
 |   */ | 
 | template<typename Derived, unsigned int Mode> | 
 | template<int Side, typename RhsDerived> | 
 | typename ei_plain_matrix_type_column_major<RhsDerived>::type | 
 | TriangularView<Derived,Mode>::solve(const MatrixBase<RhsDerived>& rhs) const | 
 | { | 
 |   typename ei_plain_matrix_type_column_major<RhsDerived>::type res(rhs); | 
 |   solveInPlace<Side>(res); | 
 |   return res; | 
 | } | 
 |  | 
 | #endif // EIGEN_SOLVETRIANGULAR_H |