1 // This file is part of Eigen, a lightweight C++ template library 2 // for linear algebra. 3 // 4 // Copyright (C) 2008-2009 Gael Guennebaud <gael.guennebaud@inria.fr> 5 // 6 // This Source Code Form is subject to the terms of the Mozilla 7 // Public License v. 2.0. If a copy of the MPL was not distributed 8 // with this file, You can obtain one at http://mozilla.org/MPL/2.0/. 9 10 #ifndef EIGEN_SOLVETRIANGULAR_H 11 #define EIGEN_SOLVETRIANGULAR_H 12 13 namespace Eigen { 14 15 namespace internal { 16 17 // Forward declarations: 18 // The following two routines are implemented in the products/TriangularSolver*.h files 19 template<typename LhsScalar, typename RhsScalar, typename Index, int Side, int Mode, bool Conjugate, int StorageOrder> 20 struct triangular_solve_vector; 21 22 template <typename Scalar, typename Index, int Side, int Mode, bool Conjugate, int TriStorageOrder, int OtherStorageOrder, int OtherInnerStride> 23 struct triangular_solve_matrix; 24 25 // small helper struct extracting some traits on the underlying solver operation 26 template<typename Lhs, typename Rhs, int Side> 27 class trsolve_traits 28 { 29 private: 30 enum { 31 RhsIsVectorAtCompileTime = (Side==OnTheLeft ? Rhs::ColsAtCompileTime : Rhs::RowsAtCompileTime)==1 32 }; 33 public: 34 enum { 35 Unrolling = (RhsIsVectorAtCompileTime && Rhs::SizeAtCompileTime != Dynamic && Rhs::SizeAtCompileTime <= 8) 36 ? CompleteUnrolling : NoUnrolling, 37 RhsVectors = RhsIsVectorAtCompileTime ? 1 : Dynamic 38 }; 39 }; 40 41 template<typename Lhs, typename Rhs, 42 int Side, // can be OnTheLeft/OnTheRight 43 int Mode, // can be Upper/Lower | UnitDiag 44 int Unrolling = trsolve_traits<Lhs,Rhs,Side>::Unrolling, 45 int RhsVectors = trsolve_traits<Lhs,Rhs,Side>::RhsVectors 46 > 47 struct triangular_solver_selector; 48 49 template<typename Lhs, typename Rhs, int Side, int Mode> 50 struct triangular_solver_selector<Lhs,Rhs,Side,Mode,NoUnrolling,1> 51 { 52 typedef typename Lhs::Scalar LhsScalar; 53 typedef typename Rhs::Scalar RhsScalar; 54 typedef blas_traits<Lhs> LhsProductTraits; 55 typedef typename LhsProductTraits::ExtractType ActualLhsType; 56 typedef Map<Matrix<RhsScalar,Dynamic,1>, Aligned> MappedRhs; 57 static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) 58 { 59 ActualLhsType actualLhs = LhsProductTraits::extract(lhs); 60 61 // FIXME find a way to allow an inner stride if packet_traits<Scalar>::size==1 62 63 bool useRhsDirectly = Rhs::InnerStrideAtCompileTime==1 || rhs.innerStride()==1; 64 65 ei_declare_aligned_stack_constructed_variable(RhsScalar,actualRhs,rhs.size(), 66 (useRhsDirectly ? rhs.data() : 0)); 67 68 if(!useRhsDirectly) 69 MappedRhs(actualRhs,rhs.size()) = rhs; 70 71 triangular_solve_vector<LhsScalar, RhsScalar, Index, Side, Mode, LhsProductTraits::NeedToConjugate, 72 (int(Lhs::Flags) & RowMajorBit) ? RowMajor : ColMajor> 73 ::run(actualLhs.cols(), actualLhs.data(), actualLhs.outerStride(), actualRhs); 74 75 if(!useRhsDirectly) 76 rhs = MappedRhs(actualRhs, rhs.size()); 77 } 78 }; 79 80 // the rhs is a matrix 81 template<typename Lhs, typename Rhs, int Side, int Mode> 82 struct triangular_solver_selector<Lhs,Rhs,Side,Mode,NoUnrolling,Dynamic> 83 { 84 typedef typename Rhs::Scalar Scalar; 85 typedef blas_traits<Lhs> LhsProductTraits; 86 typedef typename LhsProductTraits::DirectLinearAccessType ActualLhsType; 87 88 static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) 89 { 90 typename internal::add_const_on_value_type<ActualLhsType>::type actualLhs = LhsProductTraits::extract(lhs); 91 92 const Index size = lhs.rows(); 93 const Index othersize = Side==OnTheLeft? rhs.cols() : rhs.rows(); 94 95 typedef internal::gemm_blocking_space<(Rhs::Flags&RowMajorBit) ? RowMajor : ColMajor,Scalar,Scalar, 96 Rhs::MaxRowsAtCompileTime, Rhs::MaxColsAtCompileTime, Lhs::MaxRowsAtCompileTime,4> BlockingType; 97 98 BlockingType blocking(rhs.rows(), rhs.cols(), size, 1, false); 99 100 triangular_solve_matrix<Scalar,Index,Side,Mode,LhsProductTraits::NeedToConjugate,(int(Lhs::Flags) & RowMajorBit) ? RowMajor : ColMajor, 101 (Rhs::Flags&RowMajorBit) ? RowMajor : ColMajor, Rhs::InnerStrideAtCompileTime> 102 ::run(size, othersize, &actualLhs.coeffRef(0,0), actualLhs.outerStride(), &rhs.coeffRef(0,0), rhs.innerStride(), rhs.outerStride(), blocking); 103 } 104 }; 105 106 /*************************************************************************** 107 * meta-unrolling implementation 108 ***************************************************************************/ 109 110 template<typename Lhs, typename Rhs, int Mode, int LoopIndex, int Size, 111 bool Stop = LoopIndex==Size> 112 struct triangular_solver_unroller; 113 114 template<typename Lhs, typename Rhs, int Mode, int LoopIndex, int Size> 115 struct triangular_solver_unroller<Lhs,Rhs,Mode,LoopIndex,Size,false> { 116 enum { 117 IsLower = ((Mode&Lower)==Lower), 118 DiagIndex = IsLower ? LoopIndex : Size - LoopIndex - 1, 119 StartIndex = IsLower ? 0 : DiagIndex+1 120 }; 121 static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) 122 { 123 if (LoopIndex>0) 124 rhs.coeffRef(DiagIndex) -= lhs.row(DiagIndex).template segment<LoopIndex>(StartIndex).transpose() 125 .cwiseProduct(rhs.template segment<LoopIndex>(StartIndex)).sum(); 126 127 if(!(Mode & UnitDiag)) 128 rhs.coeffRef(DiagIndex) /= lhs.coeff(DiagIndex,DiagIndex); 129 130 triangular_solver_unroller<Lhs,Rhs,Mode,LoopIndex+1,Size>::run(lhs,rhs); 131 } 132 }; 133 134 template<typename Lhs, typename Rhs, int Mode, int LoopIndex, int Size> 135 struct triangular_solver_unroller<Lhs,Rhs,Mode,LoopIndex,Size,true> { 136 static EIGEN_DEVICE_FUNC void run(const Lhs&, Rhs&) {} 137 }; 138 139 template<typename Lhs, typename Rhs, int Mode> 140 struct triangular_solver_selector<Lhs,Rhs,OnTheLeft,Mode,CompleteUnrolling,1> { 141 static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) 142 { triangular_solver_unroller<Lhs,Rhs,Mode,0,Rhs::SizeAtCompileTime>::run(lhs,rhs); } 143 }; 144 145 template<typename Lhs, typename Rhs, int Mode> 146 struct triangular_solver_selector<Lhs,Rhs,OnTheRight,Mode,CompleteUnrolling,1> { 147 static EIGEN_DEVICE_FUNC void run(const Lhs& lhs, Rhs& rhs) 148 { 149 Transpose<const Lhs> trLhs(lhs); 150 Transpose<Rhs> trRhs(rhs); 151 152 triangular_solver_unroller<Transpose<const Lhs>,Transpose<Rhs>, 153 ((Mode&Upper)==Upper ? Lower : Upper) | (Mode&UnitDiag), 154 0,Rhs::SizeAtCompileTime>::run(trLhs,trRhs); 155 } 156 }; 157 158 } // end namespace internal 159 160 /*************************************************************************** 161 * TriangularView methods 162 ***************************************************************************/ 163 164 #ifndef EIGEN_PARSED_BY_DOXYGEN 165 template<typename MatrixType, unsigned int Mode> 166 template<int Side, typename OtherDerived> 167 EIGEN_DEVICE_FUNC void TriangularViewImpl<MatrixType,Mode,Dense>::solveInPlace(const MatrixBase<OtherDerived>& _other) const 168 { 169 OtherDerived& other = _other.const_cast_derived(); 170 eigen_assert( derived().cols() == derived().rows() && ((Side==OnTheLeft && derived().cols() == other.rows()) || (Side==OnTheRight && derived().cols() == other.cols())) ); 171 eigen_assert((!(int(Mode) & int(ZeroDiag))) && bool(int(Mode) & (int(Upper) | int(Lower)))); 172 // If solving for a 0x0 matrix, nothing to do, simply return. 173 if (derived().cols() == 0) 174 return; 175 176 enum { copy = (internal::traits<OtherDerived>::Flags & RowMajorBit) && OtherDerived::IsVectorAtCompileTime && OtherDerived::SizeAtCompileTime!=1}; 177 typedef typename internal::conditional<copy, 178 typename internal::plain_matrix_type_column_major<OtherDerived>::type, OtherDerived&>::type OtherCopy; 179 OtherCopy otherCopy(other); 180 181 internal::triangular_solver_selector<MatrixType, typename internal::remove_reference<OtherCopy>::type, 182 Side, Mode>::run(derived().nestedExpression(), otherCopy); 183 184 if (copy) 185 other = otherCopy; 186 } 187 188 template<typename Derived, unsigned int Mode> 189 template<int Side, typename Other> 190 const internal::triangular_solve_retval<Side,TriangularView<Derived,Mode>,Other> 191 TriangularViewImpl<Derived,Mode,Dense>::solve(const MatrixBase<Other>& other) const 192 { 193 return internal::triangular_solve_retval<Side,TriangularViewType,Other>(derived(), other.derived()); 194 } 195 #endif 196 197 namespace internal { 198 199 200 template<int Side, typename TriangularType, typename Rhs> 201 struct traits<triangular_solve_retval<Side, TriangularType, Rhs> > 202 { 203 typedef typename internal::plain_matrix_type_column_major<Rhs>::type ReturnType; 204 }; 205 206 template<int Side, typename TriangularType, typename Rhs> struct triangular_solve_retval 207 : public ReturnByValue<triangular_solve_retval<Side, TriangularType, Rhs> > 208 { 209 typedef typename remove_all<typename Rhs::Nested>::type RhsNestedCleaned; 210 typedef ReturnByValue<triangular_solve_retval> Base; 211 212 triangular_solve_retval(const TriangularType& tri, const Rhs& rhs) 213 : m_triangularMatrix(tri), m_rhs(rhs) 214 {} 215 216 inline EIGEN_CONSTEXPR Index rows() const EIGEN_NOEXCEPT { return m_rhs.rows(); } 217 inline EIGEN_CONSTEXPR Index cols() const EIGEN_NOEXCEPT { return m_rhs.cols(); } 218 219 template<typename Dest> inline void evalTo(Dest& dst) const 220 { 221 if(!is_same_dense(dst,m_rhs)) 222 dst = m_rhs; 223 m_triangularMatrix.template solveInPlace<Side>(dst); 224 } 225 226 protected: 227 const TriangularType& m_triangularMatrix; 228 typename Rhs::Nested m_rhs; 229 }; 230 231 } // namespace internal 232 233 } // end namespace Eigen 234 235 #endif // EIGEN_SOLVETRIANGULAR_H 236