| // This file is part of Eigen, a lightweight C++ template library | 
 | // for linear algebra. | 
 | // | 
 | // Copyright (C) 2008-2009 Gael Guennebaud <gael.guennebaud@inria.fr> | 
 | // | 
 | // This Source Code Form is subject to the terms of the Mozilla | 
 | // Public License v. 2.0. If a copy of the MPL was not distributed | 
 | // with this file, You can obtain one at http://mozilla.org/MPL/2.0/. | 
 |  | 
 | #ifndef EIGEN_SOLVETRIANGULAR_H | 
 | #define EIGEN_SOLVETRIANGULAR_H | 
 |  | 
 | // IWYU pragma: private | 
 | #include "./InternalHeaderCheck.h" | 
 |  | 
 | namespace Eigen { | 
 |  | 
 | namespace internal { | 
 |  | 
 | // Forward declarations: | 
 | // The following two routines are implemented in the products/TriangularSolver*.h files | 
 | template <typename LhsScalar, typename RhsScalar, typename Index, int Side, int Mode, bool Conjugate, int StorageOrder> | 
 | struct triangular_solve_vector; | 
 |  | 
 | template <typename Scalar, typename Index, int Side, int Mode, bool Conjugate, int TriStorageOrder, | 
 |           int OtherStorageOrder, int OtherInnerStride> | 
 | struct triangular_solve_matrix; | 
 |  | 
 | // small helper struct extracting some traits on the underlying solver operation | 
 | template <typename Lhs, typename Rhs, int Side> | 
 | class trsolve_traits { | 
 |  private: | 
 |   enum { RhsIsVectorAtCompileTime = (Side == OnTheLeft ? Rhs::ColsAtCompileTime : Rhs::RowsAtCompileTime) == 1 }; | 
 |  | 
 |  public: | 
 |   enum { | 
 |     Unrolling = (RhsIsVectorAtCompileTime && Rhs::SizeAtCompileTime != Dynamic && Rhs::SizeAtCompileTime <= 8) | 
 |                     ? CompleteUnrolling | 
 |                     : NoUnrolling, | 
 |     RhsVectors = RhsIsVectorAtCompileTime ? 1 : Dynamic | 
 |   }; | 
 | }; | 
 |  | 
 | template <typename Lhs, typename Rhs, | 
 |           int Side,  // can be OnTheLeft/OnTheRight | 
 |           int Mode,  // can be Upper/Lower | UnitDiag | 
 |           int Unrolling = trsolve_traits<Lhs, Rhs, Side>::Unrolling, | 
 |           int RhsVectors = trsolve_traits<Lhs, Rhs, Side>::RhsVectors> | 
 | struct triangular_solver_selector; | 
 |  | 
 | template <typename Lhs, typename Rhs, int Side, int Mode> | 
 | struct triangular_solver_selector<Lhs, Rhs, Side, Mode, NoUnrolling, 1> { | 
 |   typedef typename Lhs::Scalar LhsScalar; | 
 |   typedef typename Rhs::Scalar RhsScalar; | 
 |   typedef blas_traits<Lhs> LhsProductTraits; | 
 |   typedef typename LhsProductTraits::ExtractType ActualLhsType; | 
 |   typedef Map<Matrix<RhsScalar, Dynamic, 1>, Aligned> MappedRhs; | 
 |   static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) { | 
 |     ActualLhsType actualLhs = LhsProductTraits::extract(lhs); | 
 |  | 
 |     // FIXME find a way to allow an inner stride if packet_traits<Scalar>::size==1 | 
 |  | 
 |     bool useRhsDirectly = Rhs::InnerStrideAtCompileTime == 1 || rhs.innerStride() == 1; | 
 |  | 
 |     ei_declare_aligned_stack_constructed_variable(RhsScalar, actualRhs, rhs.size(), (useRhsDirectly ? rhs.data() : 0)); | 
 |  | 
 |     if (!useRhsDirectly) MappedRhs(actualRhs, rhs.size()) = rhs; | 
 |  | 
 |     triangular_solve_vector<LhsScalar, RhsScalar, Index, Side, Mode, LhsProductTraits::NeedToConjugate, | 
 |                             (int(Lhs::Flags) & RowMajorBit) ? RowMajor : ColMajor>::run(actualLhs.cols(), | 
 |                                                                                         actualLhs.data(), | 
 |                                                                                         actualLhs.outerStride(), | 
 |                                                                                         actualRhs); | 
 |  | 
 |     if (!useRhsDirectly) rhs = MappedRhs(actualRhs, rhs.size()); | 
 |   } | 
 | }; | 
 |  | 
 | // the rhs is a matrix | 
 | template <typename Lhs, typename Rhs, int Side, int Mode> | 
 | struct triangular_solver_selector<Lhs, Rhs, Side, Mode, NoUnrolling, Dynamic> { | 
 |   typedef typename Rhs::Scalar Scalar; | 
 |   typedef blas_traits<Lhs> LhsProductTraits; | 
 |   typedef typename LhsProductTraits::DirectLinearAccessType ActualLhsType; | 
 |  | 
 |   static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) { | 
 |     add_const_on_value_type_t<ActualLhsType> actualLhs = LhsProductTraits::extract(lhs); | 
 |  | 
 |     const Index size = lhs.rows(); | 
 |     const Index othersize = Side == OnTheLeft ? rhs.cols() : rhs.rows(); | 
 |  | 
 |     typedef internal::gemm_blocking_space<(Rhs::Flags & RowMajorBit) ? RowMajor : ColMajor, Scalar, Scalar, | 
 |                                           Rhs::MaxRowsAtCompileTime, Rhs::MaxColsAtCompileTime, | 
 |                                           Lhs::MaxRowsAtCompileTime, 4> | 
 |         BlockingType; | 
 |  | 
 |     // Nothing to solve. | 
 |     if (actualLhs.size() == 0 || rhs.size() == 0) { | 
 |       return; | 
 |     } | 
 |  | 
 |     BlockingType blocking(rhs.rows(), rhs.cols(), size, 1, false); | 
 |  | 
 |     triangular_solve_matrix<Scalar, Index, Side, Mode, LhsProductTraits::NeedToConjugate, | 
 |                             (int(Lhs::Flags) & RowMajorBit) ? RowMajor : ColMajor, | 
 |                             (Rhs::Flags & RowMajorBit) ? RowMajor : ColMajor, | 
 |                             Rhs::InnerStrideAtCompileTime>::run(size, othersize, &actualLhs.coeffRef(0, 0), | 
 |                                                                 actualLhs.outerStride(), &rhs.coeffRef(0, 0), | 
 |                                                                 rhs.innerStride(), rhs.outerStride(), blocking); | 
 |   } | 
 | }; | 
 |  | 
 | /*************************************************************************** | 
 |  * meta-unrolling implementation | 
 |  ***************************************************************************/ | 
 |  | 
 | template <typename Lhs, typename Rhs, int Mode, int LoopIndex, int Size, bool Stop = LoopIndex == Size> | 
 | struct triangular_solver_unroller; | 
 |  | 
 | template <typename Lhs, typename Rhs, int Mode, int LoopIndex, int Size> | 
 | struct triangular_solver_unroller<Lhs, Rhs, Mode, LoopIndex, Size, false> { | 
 |   enum { | 
 |     IsLower = ((Mode & Lower) == Lower), | 
 |     DiagIndex = IsLower ? LoopIndex : Size - LoopIndex - 1, | 
 |     StartIndex = IsLower ? 0 : DiagIndex + 1 | 
 |   }; | 
 |   static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) { | 
 |     if (LoopIndex > 0) | 
 |       rhs.coeffRef(DiagIndex) -= lhs.row(DiagIndex) | 
 |                                      .template segment<LoopIndex>(StartIndex) | 
 |                                      .transpose() | 
 |                                      .cwiseProduct(rhs.template segment<LoopIndex>(StartIndex)) | 
 |                                      .sum(); | 
 |  | 
 |     if (!(Mode & UnitDiag)) rhs.coeffRef(DiagIndex) /= lhs.coeff(DiagIndex, DiagIndex); | 
 |  | 
 |     triangular_solver_unroller<Lhs, Rhs, Mode, LoopIndex + 1, Size>::run(lhs, rhs); | 
 |   } | 
 | }; | 
 |  | 
 | template <typename Lhs, typename Rhs, int Mode, int LoopIndex, int Size> | 
 | struct triangular_solver_unroller<Lhs, Rhs, Mode, LoopIndex, Size, true> { | 
 |   static EIGEN_DEVICE_FUNC void run(const Lhs&, Rhs&) {} | 
 | }; | 
 |  | 
 | template <typename Lhs, typename Rhs, int Mode> | 
 | struct triangular_solver_selector<Lhs, Rhs, OnTheLeft, Mode, CompleteUnrolling, 1> { | 
 |   static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) { | 
 |     triangular_solver_unroller<Lhs, Rhs, Mode, 0, Rhs::SizeAtCompileTime>::run(lhs, rhs); | 
 |   } | 
 | }; | 
 |  | 
 | template <typename Lhs, typename Rhs, int Mode> | 
 | struct triangular_solver_selector<Lhs, Rhs, OnTheRight, Mode, CompleteUnrolling, 1> { | 
 |   static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) { | 
 |     Transpose<const Lhs> trLhs(lhs); | 
 |     Transpose<Rhs> trRhs(rhs); | 
 |  | 
 |     triangular_solver_unroller<Transpose<const Lhs>, Transpose<Rhs>, | 
 |                                ((Mode & Upper) == Upper ? Lower : Upper) | (Mode & UnitDiag), 0, | 
 |                                Rhs::SizeAtCompileTime>::run(trLhs, trRhs); | 
 |   } | 
 | }; | 
 |  | 
 | }  // end namespace internal | 
 |  | 
 | /*************************************************************************** | 
 |  * TriangularView methods | 
 |  ***************************************************************************/ | 
 |  | 
 | #ifndef EIGEN_PARSED_BY_DOXYGEN | 
 | template <typename MatrixType, unsigned int Mode> | 
 | template <int Side, typename OtherDerived> | 
 | EIGEN_DEVICE_FUNC void TriangularViewImpl<MatrixType, Mode, Dense>::solveInPlace( | 
 |     const MatrixBase<OtherDerived>& _other) const { | 
 |   OtherDerived& other = _other.const_cast_derived(); | 
 |   eigen_assert(derived().cols() == derived().rows() && ((Side == OnTheLeft && derived().cols() == other.rows()) || | 
 |                                                         (Side == OnTheRight && derived().cols() == other.cols()))); | 
 |   eigen_assert((!(int(Mode) & int(ZeroDiag))) && bool(int(Mode) & (int(Upper) | int(Lower)))); | 
 |   // If solving for a 0x0 matrix, nothing to do, simply return. | 
 |   if (derived().cols() == 0) return; | 
 |  | 
 |   enum { | 
 |     copy = (internal::traits<OtherDerived>::Flags & RowMajorBit) && OtherDerived::IsVectorAtCompileTime && | 
 |            OtherDerived::SizeAtCompileTime != 1 | 
 |   }; | 
 |   typedef std::conditional_t<copy, typename internal::plain_matrix_type_column_major<OtherDerived>::type, OtherDerived&> | 
 |       OtherCopy; | 
 |   OtherCopy otherCopy(other); | 
 |  | 
 |   internal::triangular_solver_selector<MatrixType, std::remove_reference_t<OtherCopy>, Side, Mode>::run( | 
 |       derived().nestedExpression(), otherCopy); | 
 |  | 
 |   if (copy) other = otherCopy; | 
 | } | 
 |  | 
 | template <typename Derived, unsigned int Mode> | 
 | template <int Side, typename Other> | 
 | const internal::triangular_solve_retval<Side, TriangularView<Derived, Mode>, Other> | 
 | TriangularViewImpl<Derived, Mode, Dense>::solve(const MatrixBase<Other>& other) const { | 
 |   return internal::triangular_solve_retval<Side, TriangularViewType, Other>(derived(), other.derived()); | 
 | } | 
 | #endif | 
 |  | 
 | namespace internal { | 
 |  | 
 | template <int Side, typename TriangularType, typename Rhs> | 
 | struct traits<triangular_solve_retval<Side, TriangularType, Rhs> > { | 
 |   typedef typename internal::plain_matrix_type_column_major<Rhs>::type ReturnType; | 
 | }; | 
 |  | 
 | template <int Side, typename TriangularType, typename Rhs> | 
 | struct triangular_solve_retval : public ReturnByValue<triangular_solve_retval<Side, TriangularType, Rhs> > { | 
 |   typedef remove_all_t<typename Rhs::Nested> RhsNestedCleaned; | 
 |   typedef ReturnByValue<triangular_solve_retval> Base; | 
 |  | 
 |   triangular_solve_retval(const TriangularType& tri, const Rhs& rhs) : m_triangularMatrix(tri), m_rhs(rhs) {} | 
 |  | 
 |   inline EIGEN_CONSTEXPR Index rows() const EIGEN_NOEXCEPT { return m_rhs.rows(); } | 
 |   inline EIGEN_CONSTEXPR Index cols() const EIGEN_NOEXCEPT { return m_rhs.cols(); } | 
 |  | 
 |   template <typename Dest> | 
 |   inline void evalTo(Dest& dst) const { | 
 |     if (!is_same_dense(dst, m_rhs)) dst = m_rhs; | 
 |     m_triangularMatrix.template solveInPlace<Side>(dst); | 
 |   } | 
 |  | 
 |  protected: | 
 |   const TriangularType& m_triangularMatrix; | 
 |   typename Rhs::Nested m_rhs; | 
 | }; | 
 |  | 
 | }  // namespace internal | 
 |  | 
 | }  // end namespace Eigen | 
 |  | 
 | #endif  // EIGEN_SOLVETRIANGULAR_H |