/*
 Copyright (c) 2011, Intel Corporation. All rights reserved.

 Redistribution and use in source and binary forms, with or without modification,
 are permitted provided that the following conditions are met:

 * Redistributions of source code must retain the above copyright notice, this
   list of conditions and the following disclaimer.
 * Redistributions in binary form must reproduce the above copyright notice,
   this list of conditions and the following disclaimer in the documentation
   and/or other materials provided with the distribution.
 * Neither the name of Intel Corporation nor the names of its contributors may
   be used to endorse or promote products derived from this software without
   specific prior written permission.

 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
 ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
 ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 ********************************************************************************
 *   Content : Eigen bindings to Intel(R) MKL
 *     LU decomposition with partial pivoting based on LAPACKE_?getrf function.
 ********************************************************************************
*/
32c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
33c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#ifndef EIGEN_PARTIALLU_LAPACK_H
34c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#define EIGEN_PARTIALLU_LAPACK_H
35c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
36c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#include "Eigen/src/Core/util/MKL_support.h"
37c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
38c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathnamespace Eigen {
39c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
40c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathnamespace internal {
41c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
/** \internal Specialization for the data types supported by MKL.
  *
  * Expands to a partial specialization of partial_lu_impl (index type
  * lapack_int) whose blocked_lu() forwards the in-place LU factorization with
  * partial pivoting to LAPACKE_<MKLPREFIX>getrf.
  *
  * \param EIGTYPE   scalar type used on the Eigen side
  * \param MKLTYPE   scalar type the data pointer is cast to before the call
  * \param MKLPREFIX precision letter pasted into the LAPACKE_<prefix>getrf name
  */

#define EIGEN_MKL_LU_PARTPIV(EIGTYPE, MKLTYPE, MKLPREFIX) \
template<int StorageOrder> \
struct partial_lu_impl<EIGTYPE, StorageOrder, lapack_int> \
{ \
  /* \internal performs the LU decomposition in-place of the rows x cols matrix */ \
  /* stored at lu_data with leading dimension luStride.                          */ \
  /* On return the first min(rows, cols) entries of row_transpositions hold the  */ \
  /* pivot rows converted to 0-based indices, and nb_transpositions counts the   */ \
  /* entries that differ from their own position.                                */ \
  /* maxBlockSize is ignored; it is only accepted so the signature is preserved. */ \
  /* Returns the info value of ?getrf unchanged (LAPACK documents 0 as success   */ \
  /* and i > 0 as "U(i,i) is exactly zero", with i 1-based).                     */ \
  /* NOTE(review): a caller expecting a 0-based index, or a negative value when  */ \
  /* no pivot is zero, would need info - 1 - confirm against the generic         */ \
  /* partial_lu_impl before relying on the return value.                         */ \
  static lapack_int blocked_lu(lapack_int rows, lapack_int cols, EIGTYPE* lu_data, lapack_int luStride, lapack_int* row_transpositions, lapack_int& nb_transpositions, lapack_int maxBlockSize=256) \
  { \
    EIGEN_UNUSED_VARIABLE(maxBlockSize); \
    const lapack_int matrix_order = StorageOrder==RowMajor ? LAPACK_ROW_MAJOR : LAPACK_COL_MAJOR; \
    /* ?getrf only defines min(rows, cols) pivot indices; the remaining entries */ \
    /* of the pivot array are never written by LAPACK and must not be touched.  */ \
    const lapack_int nb_pivots = rows < cols ? rows : cols; \
    nb_transpositions = 0; \
\
    const lapack_int info = LAPACKE_##MKLPREFIX##getrf( matrix_order, rows, cols, (MKLTYPE*)lu_data, luStride, row_transpositions ); \
\
    /* Check for an argument error before post-processing the pivot array. */ \
    eigen_assert(info >= 0); \
\
    for(lapack_int i=0; i<nb_pivots; ++i) { \
      /* LAPACK pivot indices are 1-based; shift them to 0-based. */ \
      --row_transpositions[i]; \
      if (row_transpositions[i]!=i) ++nb_transpositions; \
    } \
\
    return info; \
  } \
};
75c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
76c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan KamathEIGEN_MKL_LU_PARTPIV(double, double, d)
77c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan KamathEIGEN_MKL_LU_PARTPIV(float, float, s)
78c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan KamathEIGEN_MKL_LU_PARTPIV(dcomplex, MKL_Complex16, z)
79c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan KamathEIGEN_MKL_LU_PARTPIV(scomplex, MKL_Complex8, c)
80c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
81c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath} // end namespace internal
82c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
83c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath} // end namespace Eigen
84c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath
85c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#endif // EIGEN_PARTIALLU_LAPACK_H
86