1 // This file is part of Eigen, a lightweight C++ template library
2 // for linear algebra.
3 //
4 // Copyright (C) 2008 Guillaume Saupin <guillaume.saupin@cea.fr>
5 //
6 // This Source Code Form is subject to the terms of the Mozilla
7 // Public License v. 2.0. If a copy of the MPL was not distributed
8 // with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
9 
10 #ifndef EIGEN_SKYLINEINPLACELU_H
11 #define EIGEN_SKYLINEINPLACELU_H
12 
13 namespace Eigen {
14 
15 /** \ingroup Skyline_Module
16  *
17  * \class SkylineInplaceLU
18  *
19  * \brief Inplace LU decomposition of a skyline matrix and associated features
20  *
21  * \param MatrixType the type of the matrix of which we are computing the LU factorization
22  *
23  */
24 template<typename MatrixType>
25 class SkylineInplaceLU {
26 protected:
27     typedef typename MatrixType::Scalar Scalar;
28     typedef typename MatrixType::Index Index;
29 
30     typedef typename NumTraits<typename MatrixType::Scalar>::Real RealScalar;
31 
32 public:
33 
34     /** Creates a LU object and compute the respective factorization of \a matrix using
35      * flags \a flags. */
36     SkylineInplaceLU(MatrixType& matrix, int flags = 0)
37     : /*m_matrix(matrix.rows(), matrix.cols()),*/ m_flags(flags), m_status(0), m_lu(matrix) {
38         m_precision = RealScalar(0.1) * Eigen::dummy_precision<RealScalar > ();
39         m_lu.IsRowMajor ? computeRowMajor() : compute();
40     }
41 
42     /** Sets the relative threshold value used to prune zero coefficients during the decomposition.
43      *
44      * Setting a value greater than zero speeds up computation, and yields to an imcomplete
45      * factorization with fewer non zero coefficients. Such approximate factors are especially
46      * useful to initialize an iterative solver.
47      *
48      * Note that the exact meaning of this parameter might depends on the actual
49      * backend. Moreover, not all backends support this feature.
50      *
51      * \sa precision() */
52     void setPrecision(RealScalar v) {
53         m_precision = v;
54     }
55 
56     /** \returns the current precision.
57      *
58      * \sa setPrecision() */
59     RealScalar precision() const {
60         return m_precision;
61     }
62 
63     /** Sets the flags. Possible values are:
64      *  - CompleteFactorization
65      *  - IncompleteFactorization
66      *  - MemoryEfficient
67      *  - one of the ordering methods
68      *  - etc...
69      *
70      * \sa flags() */
71     void setFlags(int f) {
72         m_flags = f;
73     }
74 
75     /** \returns the current flags */
76     int flags() const {
77         return m_flags;
78     }
79 
80     void setOrderingMethod(int m) {
81         m_flags = m;
82     }
83 
84     int orderingMethod() const {
85         return m_flags;
86     }
87 
88     /** Computes/re-computes the LU factorization */
89     void compute();
90     void computeRowMajor();
91 
92     /** \returns the lower triangular matrix L */
93     //inline const MatrixType& matrixL() const { return m_matrixL; }
94 
95     /** \returns the upper triangular matrix U */
96     //inline const MatrixType& matrixU() const { return m_matrixU; }
97 
98     template<typename BDerived, typename XDerived>
99     bool solve(const MatrixBase<BDerived> &b, MatrixBase<XDerived>* x,
100             const int transposed = 0) const;
101 
102     /** \returns true if the factorization succeeded */
103     inline bool succeeded(void) const {
104         return m_succeeded;
105     }
106 
107 protected:
108     RealScalar m_precision;
109     int m_flags;
110     mutable int m_status;
111     bool m_succeeded;
112     MatrixType& m_lu;
113 };
114 
115 /** Computes / recomputes the in place LU decomposition of the SkylineInplaceLU.
116  * using the default algorithm.
117  */
118 template<typename MatrixType>
119 //template<typename _Scalar>
120 void SkylineInplaceLU<MatrixType>::compute() {
121     const size_t rows = m_lu.rows();
122     const size_t cols = m_lu.cols();
123 
124     eigen_assert(rows == cols && "We do not (yet) support rectangular LU.");
125     eigen_assert(!m_lu.IsRowMajor && "LU decomposition does not work with rowMajor Storage");
126 
127     for (Index row = 0; row < rows; row++) {
128         const double pivot = m_lu.coeffDiag(row);
129 
130         //Lower matrix Columns update
131         const Index& col = row;
132         for (typename MatrixType::InnerLowerIterator lIt(m_lu, col); lIt; ++lIt) {
133             lIt.valueRef() /= pivot;
134         }
135 
136         //Upper matrix update -> contiguous memory access
137         typename MatrixType::InnerLowerIterator lIt(m_lu, col);
138         for (Index rrow = row + 1; rrow < m_lu.rows(); rrow++) {
139             typename MatrixType::InnerUpperIterator uItPivot(m_lu, row);
140             typename MatrixType::InnerUpperIterator uIt(m_lu, rrow);
141             const double coef = lIt.value();
142 
143             uItPivot += (rrow - row - 1);
144 
145             //update upper part  -> contiguous memory access
146             for (++uItPivot; uIt && uItPivot;) {
147                 uIt.valueRef() -= uItPivot.value() * coef;
148 
149                 ++uIt;
150                 ++uItPivot;
151             }
152             ++lIt;
153         }
154 
155         //Upper matrix update -> non contiguous memory access
156         typename MatrixType::InnerLowerIterator lIt3(m_lu, col);
157         for (Index rrow = row + 1; rrow < m_lu.rows(); rrow++) {
158             typename MatrixType::InnerUpperIterator uItPivot(m_lu, row);
159             const double coef = lIt3.value();
160 
161             //update lower part ->  non contiguous memory access
162             for (Index i = 0; i < rrow - row - 1; i++) {
163                 m_lu.coeffRefLower(rrow, row + i + 1) -= uItPivot.value() * coef;
164                 ++uItPivot;
165             }
166             ++lIt3;
167         }
168         //update diag -> contiguous
169         typename MatrixType::InnerLowerIterator lIt2(m_lu, col);
170         for (Index rrow = row + 1; rrow < m_lu.rows(); rrow++) {
171 
172             typename MatrixType::InnerUpperIterator uItPivot(m_lu, row);
173             typename MatrixType::InnerUpperIterator uIt(m_lu, rrow);
174             const double coef = lIt2.value();
175 
176             uItPivot += (rrow - row - 1);
177             m_lu.coeffRefDiag(rrow) -= uItPivot.value() * coef;
178             ++lIt2;
179         }
180     }
181 }
182 
183 template<typename MatrixType>
184 void SkylineInplaceLU<MatrixType>::computeRowMajor() {
185     const size_t rows = m_lu.rows();
186     const size_t cols = m_lu.cols();
187 
188     eigen_assert(rows == cols && "We do not (yet) support rectangular LU.");
189     eigen_assert(m_lu.IsRowMajor && "You're trying to apply rowMajor decomposition on a ColMajor matrix !");
190 
191     for (Index row = 0; row < rows; row++) {
192         typename MatrixType::InnerLowerIterator llIt(m_lu, row);
193 
194 
195         for (Index col = llIt.col(); col < row; col++) {
196             if (m_lu.coeffExistLower(row, col)) {
197                 const double diag = m_lu.coeffDiag(col);
198 
199                 typename MatrixType::InnerLowerIterator lIt(m_lu, row);
200                 typename MatrixType::InnerUpperIterator uIt(m_lu, col);
201 
202 
203                 const Index offset = lIt.col() - uIt.row();
204 
205 
206                 Index stop = offset > 0 ? col - lIt.col() : col - uIt.row();
207 
208                 //#define VECTORIZE
209 #ifdef VECTORIZE
210                 Map<VectorXd > rowVal(lIt.valuePtr() + (offset > 0 ? 0 : -offset), stop);
211                 Map<VectorXd > colVal(uIt.valuePtr() + (offset > 0 ? offset : 0), stop);
212 
213 
214                 Scalar newCoeff = m_lu.coeffLower(row, col) - rowVal.dot(colVal);
215 #else
216                 if (offset > 0) //Skip zero value of lIt
217                     uIt += offset;
218                 else //Skip zero values of uIt
219                     lIt += -offset;
220                 Scalar newCoeff = m_lu.coeffLower(row, col);
221 
222                 for (Index k = 0; k < stop; ++k) {
223                     const Scalar tmp = newCoeff;
224                     newCoeff = tmp - lIt.value() * uIt.value();
225                     ++lIt;
226                     ++uIt;
227                 }
228 #endif
229 
230                 m_lu.coeffRefLower(row, col) = newCoeff / diag;
231             }
232         }
233 
234         //Upper matrix update
235         const Index col = row;
236         typename MatrixType::InnerUpperIterator uuIt(m_lu, col);
237         for (Index rrow = uuIt.row(); rrow < col; rrow++) {
238 
239             typename MatrixType::InnerLowerIterator lIt(m_lu, rrow);
240             typename MatrixType::InnerUpperIterator uIt(m_lu, col);
241             const Index offset = lIt.col() - uIt.row();
242 
243             Index stop = offset > 0 ? rrow - lIt.col() : rrow - uIt.row();
244 
245 #ifdef VECTORIZE
246             Map<VectorXd > rowVal(lIt.valuePtr() + (offset > 0 ? 0 : -offset), stop);
247             Map<VectorXd > colVal(uIt.valuePtr() + (offset > 0 ? offset : 0), stop);
248 
249             Scalar newCoeff = m_lu.coeffUpper(rrow, col) - rowVal.dot(colVal);
250 #else
251             if (offset > 0) //Skip zero value of lIt
252                 uIt += offset;
253             else //Skip zero values of uIt
254                 lIt += -offset;
255             Scalar newCoeff = m_lu.coeffUpper(rrow, col);
256             for (Index k = 0; k < stop; ++k) {
257                 const Scalar tmp = newCoeff;
258                 newCoeff = tmp - lIt.value() * uIt.value();
259 
260                 ++lIt;
261                 ++uIt;
262             }
263 #endif
264             m_lu.coeffRefUpper(rrow, col) = newCoeff;
265         }
266 
267 
268         //Diag matrix update
269         typename MatrixType::InnerLowerIterator lIt(m_lu, row);
270         typename MatrixType::InnerUpperIterator uIt(m_lu, row);
271 
272         const Index offset = lIt.col() - uIt.row();
273 
274 
275         Index stop = offset > 0 ? lIt.size() : uIt.size();
276 #ifdef VECTORIZE
277         Map<VectorXd > rowVal(lIt.valuePtr() + (offset > 0 ? 0 : -offset), stop);
278         Map<VectorXd > colVal(uIt.valuePtr() + (offset > 0 ? offset : 0), stop);
279         Scalar newCoeff = m_lu.coeffDiag(row) - rowVal.dot(colVal);
280 #else
281         if (offset > 0) //Skip zero value of lIt
282             uIt += offset;
283         else //Skip zero values of uIt
284             lIt += -offset;
285         Scalar newCoeff = m_lu.coeffDiag(row);
286         for (Index k = 0; k < stop; ++k) {
287             const Scalar tmp = newCoeff;
288             newCoeff = tmp - lIt.value() * uIt.value();
289             ++lIt;
290             ++uIt;
291         }
292 #endif
293         m_lu.coeffRefDiag(row) = newCoeff;
294     }
295 }
296 
297 /** Computes *x = U^-1 L^-1 b
298  *
299  * If \a transpose is set to SvTranspose or SvAdjoint, the solution
300  * of the transposed/adjoint system is computed instead.
301  *
302  * Not all backends implement the solution of the transposed or
303  * adjoint system.
304  */
305 template<typename MatrixType>
306 template<typename BDerived, typename XDerived>
307 bool SkylineInplaceLU<MatrixType>::solve(const MatrixBase<BDerived> &b, MatrixBase<XDerived>* x, const int transposed) const {
308     const size_t rows = m_lu.rows();
309     const size_t cols = m_lu.cols();
310 
311 
312     for (Index row = 0; row < rows; row++) {
313         x->coeffRef(row) = b.coeff(row);
314         Scalar newVal = x->coeff(row);
315         typename MatrixType::InnerLowerIterator lIt(m_lu, row);
316 
317         Index col = lIt.col();
318         while (lIt.col() < row) {
319 
320             newVal -= x->coeff(col++) * lIt.value();
321             ++lIt;
322         }
323 
324         x->coeffRef(row) = newVal;
325     }
326 
327 
328     for (Index col = rows - 1; col > 0; col--) {
329         x->coeffRef(col) = x->coeff(col) / m_lu.coeffDiag(col);
330 
331         const Scalar x_col = x->coeff(col);
332 
333         typename MatrixType::InnerUpperIterator uIt(m_lu, col);
334         uIt += uIt.size()-1;
335 
336 
337         while (uIt) {
338             x->coeffRef(uIt.row()) -= x_col * uIt.value();
339             //TODO : introduce --operator
340             uIt += -1;
341         }
342 
343 
344     }
345     x->coeffRef(0) = x->coeff(0) / m_lu.coeffDiag(0);
346 
347     return true;
348 }
349 
350 } // end namespace Eigen
351 
352 #endif // EIGEN_SKYLINELU_H
353