1 | // This file is part of Eigen, a lightweight C++ template library |
---|
2 | // for linear algebra. |
---|
3 | // |
---|
4 | // Copyright (C) 2008-2009 Gael Guennebaud <gael.guennebaud@inria.fr> |
---|
5 | // |
---|
6 | // This Source Code Form is subject to the terms of the Mozilla |
---|
7 | // Public License v. 2.0. If a copy of the MPL was not distributed |
---|
8 | // with this file, You can obtain one at http://mozilla.org/MPL/2.0/. |
---|
9 | |
---|
10 | #ifndef EIGEN_SOLVETRIANGULAR_H |
---|
11 | #define EIGEN_SOLVETRIANGULAR_H |
---|
12 | |
---|
13 | namespace Eigen { |
---|
14 | |
---|
15 | namespace internal { |
---|
16 | |
---|
// Forward declarations of the low-level kernels.
// Both are implemented in the products/TriangularSolver*.h files.

// Kernel invoked by the selector below when the right-hand side is a single vector.
template<typename LhsScalar, typename RhsScalar, typename Index,
         int Side, int Mode, bool Conjugate, int StorageOrder>
struct triangular_solve_vector;

// Kernel invoked by the selector below when the right-hand side is a matrix.
template<typename Scalar, typename Index,
         int Side, int Mode, bool Conjugate,
         int TriStorageOrder, int OtherStorageOrder>
struct triangular_solve_matrix;
---|
24 | |
---|
25 | // small helper struct extracting some traits on the underlying solver operation |
---|
26 | template<typename Lhs, typename Rhs, int Side> |
---|
27 | class trsolve_traits |
---|
28 | { |
---|
29 | private: |
---|
30 | enum { |
---|
31 | RhsIsVectorAtCompileTime = (Side==OnTheLeft ? Rhs::ColsAtCompileTime : Rhs::RowsAtCompileTime)==1 |
---|
32 | }; |
---|
33 | public: |
---|
34 | enum { |
---|
35 | Unrolling = (RhsIsVectorAtCompileTime && Rhs::SizeAtCompileTime != Dynamic && Rhs::SizeAtCompileTime <= 8) |
---|
36 | ? CompleteUnrolling : NoUnrolling, |
---|
37 | RhsVectors = RhsIsVectorAtCompileTime ? 1 : Dynamic |
---|
38 | }; |
---|
39 | }; |
---|
40 | |
---|
41 | template<typename Lhs, typename Rhs, |
---|
42 | int Side, // can be OnTheLeft/OnTheRight |
---|
43 | int Mode, // can be Upper/Lower | UnitDiag |
---|
44 | int Unrolling = trsolve_traits<Lhs,Rhs,Side>::Unrolling, |
---|
45 | int RhsVectors = trsolve_traits<Lhs,Rhs,Side>::RhsVectors |
---|
46 | > |
---|
47 | struct triangular_solver_selector; |
---|
48 | |
---|
49 | template<typename Lhs, typename Rhs, int Side, int Mode> |
---|
50 | struct triangular_solver_selector<Lhs,Rhs,Side,Mode,NoUnrolling,1> |
---|
51 | { |
---|
52 | typedef typename Lhs::Scalar LhsScalar; |
---|
53 | typedef typename Rhs::Scalar RhsScalar; |
---|
54 | typedef blas_traits<Lhs> LhsProductTraits; |
---|
55 | typedef typename LhsProductTraits::ExtractType ActualLhsType; |
---|
56 | typedef Map<Matrix<RhsScalar,Dynamic,1>, Aligned> MappedRhs; |
---|
57 | static void run(const Lhs& lhs, Rhs& rhs) |
---|
58 | { |
---|
59 | ActualLhsType actualLhs = LhsProductTraits::extract(lhs); |
---|
60 | |
---|
61 | // FIXME find a way to allow an inner stride if packet_traits<Scalar>::size==1 |
---|
62 | |
---|
63 | bool useRhsDirectly = Rhs::InnerStrideAtCompileTime==1 || rhs.innerStride()==1; |
---|
64 | |
---|
65 | ei_declare_aligned_stack_constructed_variable(RhsScalar,actualRhs,rhs.size(), |
---|
66 | (useRhsDirectly ? rhs.data() : 0)); |
---|
67 | |
---|
68 | if(!useRhsDirectly) |
---|
69 | MappedRhs(actualRhs,rhs.size()) = rhs; |
---|
70 | |
---|
71 | triangular_solve_vector<LhsScalar, RhsScalar, typename Lhs::Index, Side, Mode, LhsProductTraits::NeedToConjugate, |
---|
72 | (int(Lhs::Flags) & RowMajorBit) ? RowMajor : ColMajor> |
---|
73 | ::run(actualLhs.cols(), actualLhs.data(), actualLhs.outerStride(), actualRhs); |
---|
74 | |
---|
75 | if(!useRhsDirectly) |
---|
76 | rhs = MappedRhs(actualRhs, rhs.size()); |
---|
77 | } |
---|
78 | }; |
---|
79 | |
---|
80 | // the rhs is a matrix |
---|
81 | template<typename Lhs, typename Rhs, int Side, int Mode> |
---|
82 | struct triangular_solver_selector<Lhs,Rhs,Side,Mode,NoUnrolling,Dynamic> |
---|
83 | { |
---|
84 | typedef typename Rhs::Scalar Scalar; |
---|
85 | typedef typename Rhs::Index Index; |
---|
86 | typedef blas_traits<Lhs> LhsProductTraits; |
---|
87 | typedef typename LhsProductTraits::DirectLinearAccessType ActualLhsType; |
---|
88 | |
---|
89 | static void run(const Lhs& lhs, Rhs& rhs) |
---|
90 | { |
---|
91 | typename internal::add_const_on_value_type<ActualLhsType>::type actualLhs = LhsProductTraits::extract(lhs); |
---|
92 | |
---|
93 | const Index size = lhs.rows(); |
---|
94 | const Index othersize = Side==OnTheLeft? rhs.cols() : rhs.rows(); |
---|
95 | |
---|
96 | typedef internal::gemm_blocking_space<(Rhs::Flags&RowMajorBit) ? RowMajor : ColMajor,Scalar,Scalar, |
---|
97 | Rhs::MaxRowsAtCompileTime, Rhs::MaxColsAtCompileTime, Lhs::MaxRowsAtCompileTime,4> BlockingType; |
---|
98 | |
---|
99 | BlockingType blocking(rhs.rows(), rhs.cols(), size); |
---|
100 | |
---|
101 | triangular_solve_matrix<Scalar,Index,Side,Mode,LhsProductTraits::NeedToConjugate,(int(Lhs::Flags) & RowMajorBit) ? RowMajor : ColMajor, |
---|
102 | (Rhs::Flags&RowMajorBit) ? RowMajor : ColMajor> |
---|
103 | ::run(size, othersize, &actualLhs.coeffRef(0,0), actualLhs.outerStride(), &rhs.coeffRef(0,0), rhs.outerStride(), blocking); |
---|
104 | } |
---|
105 | }; |
---|
106 | |
---|
/***************************************************************************
* meta-unrolling implementation
***************************************************************************/

// Compile-time recursion over the coefficients of a fixed-size vector:
// Index is the current step, Size the total number of steps. Stop selects
// between the recursion step (false) and its terminator (true).
template<typename Lhs, typename Rhs, int Mode, int Index, int Size,
         bool Stop = (Index==Size)>
struct triangular_solver_unroller;
---|
114 | |
---|
115 | template<typename Lhs, typename Rhs, int Mode, int Index, int Size> |
---|
116 | struct triangular_solver_unroller<Lhs,Rhs,Mode,Index,Size,false> { |
---|
117 | enum { |
---|
118 | IsLower = ((Mode&Lower)==Lower), |
---|
119 | I = IsLower ? Index : Size - Index - 1, |
---|
120 | S = IsLower ? 0 : I+1 |
---|
121 | }; |
---|
122 | static void run(const Lhs& lhs, Rhs& rhs) |
---|
123 | { |
---|
124 | if (Index>0) |
---|
125 | rhs.coeffRef(I) -= lhs.row(I).template segment<Index>(S).transpose() |
---|
126 | .cwiseProduct(rhs.template segment<Index>(S)).sum(); |
---|
127 | |
---|
128 | if(!(Mode & UnitDiag)) |
---|
129 | rhs.coeffRef(I) /= lhs.coeff(I,I); |
---|
130 | |
---|
131 | triangular_solver_unroller<Lhs,Rhs,Mode,Index+1,Size>::run(lhs,rhs); |
---|
132 | } |
---|
133 | }; |
---|
134 | |
---|
135 | template<typename Lhs, typename Rhs, int Mode, int Index, int Size> |
---|
136 | struct triangular_solver_unroller<Lhs,Rhs,Mode,Index,Size,true> { |
---|
137 | static void run(const Lhs&, Rhs&) {} |
---|
138 | }; |
---|
139 | |
---|
140 | template<typename Lhs, typename Rhs, int Mode> |
---|
141 | struct triangular_solver_selector<Lhs,Rhs,OnTheLeft,Mode,CompleteUnrolling,1> { |
---|
142 | static void run(const Lhs& lhs, Rhs& rhs) |
---|
143 | { triangular_solver_unroller<Lhs,Rhs,Mode,0,Rhs::SizeAtCompileTime>::run(lhs,rhs); } |
---|
144 | }; |
---|
145 | |
---|
146 | template<typename Lhs, typename Rhs, int Mode> |
---|
147 | struct triangular_solver_selector<Lhs,Rhs,OnTheRight,Mode,CompleteUnrolling,1> { |
---|
148 | static void run(const Lhs& lhs, Rhs& rhs) |
---|
149 | { |
---|
150 | Transpose<const Lhs> trLhs(lhs); |
---|
151 | Transpose<Rhs> trRhs(rhs); |
---|
152 | |
---|
153 | triangular_solver_unroller<Transpose<const Lhs>,Transpose<Rhs>, |
---|
154 | ((Mode&Upper)==Upper ? Lower : Upper) | (Mode&UnitDiag), |
---|
155 | 0,Rhs::SizeAtCompileTime>::run(trLhs,trRhs); |
---|
156 | } |
---|
157 | }; |
---|
158 | |
---|
159 | } // end namespace internal |
---|
160 | |
---|
161 | /*************************************************************************** |
---|
162 | * TriangularView methods |
---|
163 | ***************************************************************************/ |
---|
164 | |
---|
165 | /** "in-place" version of TriangularView::solve() where the result is written in \a other |
---|
166 | * |
---|
167 | * \warning The parameter is only marked 'const' to make the C++ compiler accept a temporary expression here. |
---|
168 | * This function will const_cast it, so constness isn't honored here. |
---|
169 | * |
---|
170 | * See TriangularView:solve() for the details. |
---|
171 | */ |
---|
172 | template<typename MatrixType, unsigned int Mode> |
---|
173 | template<int Side, typename OtherDerived> |
---|
174 | void TriangularView<MatrixType,Mode>::solveInPlace(const MatrixBase<OtherDerived>& _other) const |
---|
175 | { |
---|
176 | OtherDerived& other = _other.const_cast_derived(); |
---|
177 | eigen_assert( cols() == rows() && ((Side==OnTheLeft && cols() == other.rows()) || (Side==OnTheRight && cols() == other.cols())) ); |
---|
178 | eigen_assert((!(Mode & ZeroDiag)) && bool(Mode & (Upper|Lower))); |
---|
179 | |
---|
180 | enum { copy = internal::traits<OtherDerived>::Flags & RowMajorBit && OtherDerived::IsVectorAtCompileTime }; |
---|
181 | typedef typename internal::conditional<copy, |
---|
182 | typename internal::plain_matrix_type_column_major<OtherDerived>::type, OtherDerived&>::type OtherCopy; |
---|
183 | OtherCopy otherCopy(other); |
---|
184 | |
---|
185 | internal::triangular_solver_selector<MatrixType, typename internal::remove_reference<OtherCopy>::type, |
---|
186 | Side, Mode>::run(nestedExpression(), otherCopy); |
---|
187 | |
---|
188 | if (copy) |
---|
189 | other = otherCopy; |
---|
190 | } |
---|
191 | |
---|
192 | /** \returns the product of the inverse of \c *this with \a other, \a *this being triangular. |
---|
193 | * |
---|
194 | * This function computes the inverse-matrix matrix product inverse(\c *this) * \a other if |
---|
195 | * \a Side==OnTheLeft (the default), or the right-inverse-multiply \a other * inverse(\c *this) if |
---|
196 | * \a Side==OnTheRight. |
---|
197 | * |
---|
198 | * The matrix \c *this must be triangular and invertible (i.e., all the coefficients of the |
---|
199 | * diagonal must be non zero). It works as a forward (resp. backward) substitution if \c *this |
---|
200 | * is an upper (resp. lower) triangular matrix. |
---|
201 | * |
---|
202 | * Example: \include MatrixBase_marked.cpp |
---|
203 | * Output: \verbinclude MatrixBase_marked.out |
---|
204 | * |
---|
205 | * This function returns an expression of the inverse-multiply and can works in-place if it is assigned |
---|
206 | * to the same matrix or vector \a other. |
---|
207 | * |
---|
208 | * For users coming from BLAS, this function (and more specifically solveInPlace()) offer |
---|
209 | * all the operations supported by the \c *TRSV and \c *TRSM BLAS routines. |
---|
210 | * |
---|
211 | * \sa TriangularView::solveInPlace() |
---|
212 | */ |
---|
213 | template<typename Derived, unsigned int Mode> |
---|
214 | template<int Side, typename Other> |
---|
215 | const internal::triangular_solve_retval<Side,TriangularView<Derived,Mode>,Other> |
---|
216 | TriangularView<Derived,Mode>::solve(const MatrixBase<Other>& other) const |
---|
217 | { |
---|
218 | return internal::triangular_solve_retval<Side,TriangularView,Other>(*this, other.derived()); |
---|
219 | } |
---|
220 | |
---|
221 | namespace internal { |
---|
222 | |
---|
223 | |
---|
224 | template<int Side, typename TriangularType, typename Rhs> |
---|
225 | struct traits<triangular_solve_retval<Side, TriangularType, Rhs> > |
---|
226 | { |
---|
227 | typedef typename internal::plain_matrix_type_column_major<Rhs>::type ReturnType; |
---|
228 | }; |
---|
229 | |
---|
230 | template<int Side, typename TriangularType, typename Rhs> struct triangular_solve_retval |
---|
231 | : public ReturnByValue<triangular_solve_retval<Side, TriangularType, Rhs> > |
---|
232 | { |
---|
233 | typedef typename remove_all<typename Rhs::Nested>::type RhsNestedCleaned; |
---|
234 | typedef ReturnByValue<triangular_solve_retval> Base; |
---|
235 | typedef typename Base::Index Index; |
---|
236 | |
---|
237 | triangular_solve_retval(const TriangularType& tri, const Rhs& rhs) |
---|
238 | : m_triangularMatrix(tri), m_rhs(rhs) |
---|
239 | {} |
---|
240 | |
---|
241 | inline Index rows() const { return m_rhs.rows(); } |
---|
242 | inline Index cols() const { return m_rhs.cols(); } |
---|
243 | |
---|
244 | template<typename Dest> inline void evalTo(Dest& dst) const |
---|
245 | { |
---|
246 | if(!(is_same<RhsNestedCleaned,Dest>::value && extract_data(dst) == extract_data(m_rhs))) |
---|
247 | dst = m_rhs; |
---|
248 | m_triangularMatrix.template solveInPlace<Side>(dst); |
---|
249 | } |
---|
250 | |
---|
251 | protected: |
---|
252 | const TriangularType& m_triangularMatrix; |
---|
253 | typename Rhs::Nested m_rhs; |
---|
254 | }; |
---|
255 | |
---|
256 | } // namespace internal |
---|
257 | |
---|
258 | } // end namespace Eigen |
---|
259 | |
---|
260 | #endif // EIGEN_SOLVETRIANGULAR_H |
---|