/*
 Copyright (c) 2011, Intel Corporation. All rights reserved.

 Redistribution and use in source and binary forms, with or without modification,
 are permitted provided that the following conditions are met:

 * Redistributions of source code must retain the above copyright notice, this
   list of conditions and the following disclaimer.
 * Redistributions in binary form must reproduce the above copyright notice,
   this list of conditions and the following disclaimer in the documentation
   and/or other materials provided with the distribution.
 * Neither the name of Intel Corporation nor the names of its contributors may
   be used to endorse or promote products derived from this software without
   specific prior written permission.

 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
 ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
 ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 ********************************************************************************
 *   Content : Eigen bindings to Intel(R) MKL
 *     LU decomposition with partial pivoting based on LAPACKE_?getrf function.
30c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath ******************************************************************************** 31c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath*/ 32c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 33c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#ifndef EIGEN_PARTIALLU_LAPACK_H 34c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#define EIGEN_PARTIALLU_LAPACK_H 35c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 36c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#include "Eigen/src/Core/util/MKL_support.h" 37c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 38c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathnamespace Eigen { 39c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 40c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathnamespace internal { 41c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 42c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath/** \internal Specialization for the data types supported by MKL */ 43c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 44c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#define EIGEN_MKL_LU_PARTPIV(EIGTYPE, MKLTYPE, MKLPREFIX) \ 45c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathtemplate<int StorageOrder> \ 46c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamathstruct partial_lu_impl<EIGTYPE, StorageOrder, lapack_int> \ 47c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath{ \ 48c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath /* \internal performs the LU decomposition in-place of the matrix represented */ \ 49c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath static lapack_int blocked_lu(lapack_int rows, lapack_int cols, EIGTYPE* lu_data, lapack_int luStride, lapack_int* row_transpositions, lapack_int& nb_transpositions, lapack_int maxBlockSize=256) \ 50c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath { \ 51c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 
EIGEN_UNUSED_VARIABLE(maxBlockSize);\ 52c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath lapack_int matrix_order, first_zero_pivot; \ 53c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath lapack_int m, n, lda, *ipiv, info; \ 54c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath EIGTYPE* a; \ 55c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath/* Set up parameters for ?getrf */ \ 56c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath matrix_order = StorageOrder==RowMajor ? LAPACK_ROW_MAJOR : LAPACK_COL_MAJOR; \ 57c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath lda = luStride; \ 58c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath a = lu_data; \ 59c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath ipiv = row_transpositions; \ 60c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath m = rows; \ 61c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath n = cols; \ 62c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath nb_transpositions = 0; \ 63c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath\ 64c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath info = LAPACKE_##MKLPREFIX##getrf( matrix_order, m, n, (MKLTYPE*)a, lda, ipiv ); \ 65c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath\ 66c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath for(int i=0;i<m;i++) { ipiv[i]--; if (ipiv[i]!=i) nb_transpositions++; } \ 67c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath\ 68c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath eigen_assert(info >= 0); \ 69c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath/* something should be done with nb_transpositions */ \ 70c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath\ 71c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath first_zero_pivot = info; \ 72c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath return first_zero_pivot; \ 73c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath } \ 74c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath}; 
75c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 76c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan KamathEIGEN_MKL_LU_PARTPIV(double, double, d) 77c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan KamathEIGEN_MKL_LU_PARTPIV(float, float, s) 78c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan KamathEIGEN_MKL_LU_PARTPIV(dcomplex, MKL_Complex16, z) 79c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan KamathEIGEN_MKL_LU_PARTPIV(scomplex, MKL_Complex8, c) 80c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 81c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath} // end namespace internal 82c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 83c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath} // end namespace Eigen 84c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath 85c981c48f5bc9aefeffc0bcb0cc3934c2fae179ddNarayan Kamath#endif // EIGEN_PARTIALLU_LAPACK_H 86