1 | /*
|
---|
2 | Copyright (c) 2011, Intel Corporation. All rights reserved.
|
---|
3 |
|
---|
4 | Redistribution and use in source and binary forms, with or without modification,
|
---|
5 | are permitted provided that the following conditions are met:
|
---|
6 |
|
---|
7 | * Redistributions of source code must retain the above copyright notice, this
|
---|
8 | list of conditions and the following disclaimer.
|
---|
9 | * Redistributions in binary form must reproduce the above copyright notice,
|
---|
10 | this list of conditions and the following disclaimer in the documentation
|
---|
11 | and/or other materials provided with the distribution.
|
---|
12 | * Neither the name of Intel Corporation nor the names of its contributors may
|
---|
13 | be used to endorse or promote products derived from this software without
|
---|
14 | specific prior written permission.
|
---|
15 |
|
---|
16 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
---|
17 | ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
---|
18 | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
---|
19 | DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
|
---|
20 | ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
---|
21 | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
|
---|
22 | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
|
---|
23 | ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
---|
24 | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
---|
25 | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
---|
26 |
|
---|
27 | ********************************************************************************
|
---|
28 | * Content : Eigen bindings to Intel(R) MKL
|
---|
29 | * Level 3 BLAS SYRK/HERK implementation.
|
---|
30 | ********************************************************************************
|
---|
31 | */
|
---|
32 |
|
---|
33 | #ifndef EIGEN_GENERAL_MATRIX_MATRIX_TRIANGULAR_MKL_H
|
---|
34 | #define EIGEN_GENERAL_MATRIX_MATRIX_TRIANGULAR_MKL_H
|
---|
35 |
|
---|
36 | namespace Eigen {
|
---|
37 |
|
---|
38 | namespace internal {
|
---|
39 |
|
---|
40 | template <typename Index, typename Scalar, int AStorageOrder, bool ConjugateA, int ResStorageOrder, int UpLo>
|
---|
41 | struct general_matrix_matrix_rankupdate :
|
---|
42 | general_matrix_matrix_triangular_product<
|
---|
43 | Index,Scalar,AStorageOrder,ConjugateA,Scalar,AStorageOrder,ConjugateA,ResStorageOrder,UpLo,BuiltIn> {};
|
---|
44 |
|
---|
45 |
|
---|
46 | // try to go to BLAS specialization
|
---|
47 | #define EIGEN_MKL_RANKUPDATE_SPECIALIZE(Scalar) \
|
---|
48 | template <typename Index, int LhsStorageOrder, bool ConjugateLhs, \
|
---|
49 | int RhsStorageOrder, bool ConjugateRhs, int UpLo> \
|
---|
50 | struct general_matrix_matrix_triangular_product<Index,Scalar,LhsStorageOrder,ConjugateLhs, \
|
---|
51 | Scalar,RhsStorageOrder,ConjugateRhs,ColMajor,UpLo,Specialized> { \
|
---|
52 | static EIGEN_STRONG_INLINE void run(Index size, Index depth,const Scalar* lhs, Index lhsStride, \
|
---|
53 | const Scalar* rhs, Index rhsStride, Scalar* res, Index resStride, Scalar alpha) \
|
---|
54 | { \
|
---|
55 | if (lhs==rhs) { \
|
---|
56 | general_matrix_matrix_rankupdate<Index,Scalar,LhsStorageOrder,ConjugateLhs,ColMajor,UpLo> \
|
---|
57 | ::run(size,depth,lhs,lhsStride,rhs,rhsStride,res,resStride,alpha); \
|
---|
58 | } else { \
|
---|
59 | general_matrix_matrix_triangular_product<Index, \
|
---|
60 | Scalar, LhsStorageOrder, ConjugateLhs, \
|
---|
61 | Scalar, RhsStorageOrder, ConjugateRhs, \
|
---|
62 | ColMajor, UpLo, BuiltIn> \
|
---|
63 | ::run(size,depth,lhs,lhsStride,rhs,rhsStride,res,resStride,alpha); \
|
---|
64 | } \
|
---|
65 | } \
|
---|
66 | };
|
---|
67 |
|
---|
68 | EIGEN_MKL_RANKUPDATE_SPECIALIZE(double)
|
---|
69 | //EIGEN_MKL_RANKUPDATE_SPECIALIZE(dcomplex)
|
---|
70 | EIGEN_MKL_RANKUPDATE_SPECIALIZE(float)
|
---|
71 | //EIGEN_MKL_RANKUPDATE_SPECIALIZE(scomplex)
|
---|
72 |
|
---|
73 | // SYRK for float/double
|
---|
74 | #define EIGEN_MKL_RANKUPDATE_R(EIGTYPE, MKLTYPE, MKLFUNC) \
|
---|
75 | template <typename Index, int AStorageOrder, bool ConjugateA, int UpLo> \
|
---|
76 | struct general_matrix_matrix_rankupdate<Index,EIGTYPE,AStorageOrder,ConjugateA,ColMajor,UpLo> { \
|
---|
77 | enum { \
|
---|
78 | IsLower = (UpLo&Lower) == Lower, \
|
---|
79 | LowUp = IsLower ? Lower : Upper, \
|
---|
80 | conjA = ((AStorageOrder==ColMajor) && ConjugateA) ? 1 : 0 \
|
---|
81 | }; \
|
---|
82 | static EIGEN_STRONG_INLINE void run(Index size, Index depth,const EIGTYPE* lhs, Index lhsStride, \
|
---|
83 | const EIGTYPE* rhs, Index rhsStride, EIGTYPE* res, Index resStride, EIGTYPE alpha) \
|
---|
84 | { \
|
---|
85 | /* typedef Matrix<EIGTYPE, Dynamic, Dynamic, RhsStorageOrder> MatrixRhs;*/ \
|
---|
86 | \
|
---|
87 | MKL_INT lda=lhsStride, ldc=resStride, n=size, k=depth; \
|
---|
88 | char uplo=(IsLower) ? 'L' : 'U', trans=(AStorageOrder==RowMajor) ? 'T':'N'; \
|
---|
89 | MKLTYPE alpha_, beta_; \
|
---|
90 | \
|
---|
91 | /* Set alpha_ & beta_ */ \
|
---|
92 | assign_scalar_eig2mkl<MKLTYPE, EIGTYPE>(alpha_, alpha); \
|
---|
93 | assign_scalar_eig2mkl<MKLTYPE, EIGTYPE>(beta_, EIGTYPE(1)); \
|
---|
94 | MKLFUNC(&uplo, &trans, &n, &k, &alpha_, lhs, &lda, &beta_, res, &ldc); \
|
---|
95 | } \
|
---|
96 | };
|
---|
97 |
|
---|
98 | // HERK for complex data
|
---|
99 | #define EIGEN_MKL_RANKUPDATE_C(EIGTYPE, MKLTYPE, RTYPE, MKLFUNC) \
|
---|
100 | template <typename Index, int AStorageOrder, bool ConjugateA, int UpLo> \
|
---|
101 | struct general_matrix_matrix_rankupdate<Index,EIGTYPE,AStorageOrder,ConjugateA,ColMajor,UpLo> { \
|
---|
102 | enum { \
|
---|
103 | IsLower = (UpLo&Lower) == Lower, \
|
---|
104 | LowUp = IsLower ? Lower : Upper, \
|
---|
105 | conjA = (((AStorageOrder==ColMajor) && ConjugateA) || ((AStorageOrder==RowMajor) && !ConjugateA)) ? 1 : 0 \
|
---|
106 | }; \
|
---|
107 | static EIGEN_STRONG_INLINE void run(Index size, Index depth,const EIGTYPE* lhs, Index lhsStride, \
|
---|
108 | const EIGTYPE* rhs, Index rhsStride, EIGTYPE* res, Index resStride, EIGTYPE alpha) \
|
---|
109 | { \
|
---|
110 | typedef Matrix<EIGTYPE, Dynamic, Dynamic, AStorageOrder> MatrixType; \
|
---|
111 | \
|
---|
112 | MKL_INT lda=lhsStride, ldc=resStride, n=size, k=depth; \
|
---|
113 | char uplo=(IsLower) ? 'L' : 'U', trans=(AStorageOrder==RowMajor) ? 'C':'N'; \
|
---|
114 | RTYPE alpha_, beta_; \
|
---|
115 | const EIGTYPE* a_ptr; \
|
---|
116 | \
|
---|
117 | /* Set alpha_ & beta_ */ \
|
---|
118 | /* assign_scalar_eig2mkl<MKLTYPE, EIGTYPE>(alpha_, alpha); */\
|
---|
119 | /* assign_scalar_eig2mkl<MKLTYPE, EIGTYPE>(beta_, EIGTYPE(1));*/ \
|
---|
120 | alpha_ = alpha.real(); \
|
---|
121 | beta_ = 1.0; \
|
---|
122 | /* Copy with conjugation in some cases*/ \
|
---|
123 | MatrixType a; \
|
---|
124 | if (conjA) { \
|
---|
125 | Map<const MatrixType, 0, OuterStride<> > mapA(lhs,n,k,OuterStride<>(lhsStride)); \
|
---|
126 | a = mapA.conjugate(); \
|
---|
127 | lda = a.outerStride(); \
|
---|
128 | a_ptr = a.data(); \
|
---|
129 | } else a_ptr=lhs; \
|
---|
130 | MKLFUNC(&uplo, &trans, &n, &k, &alpha_, (MKLTYPE*)a_ptr, &lda, &beta_, (MKLTYPE*)res, &ldc); \
|
---|
131 | } \
|
---|
132 | };
|
---|
133 |
|
---|
134 |
|
---|
135 | EIGEN_MKL_RANKUPDATE_R(double, double, dsyrk)
|
---|
136 | EIGEN_MKL_RANKUPDATE_R(float, float, ssyrk)
|
---|
137 |
|
---|
138 | //EIGEN_MKL_RANKUPDATE_C(dcomplex, MKL_Complex16, double, zherk)
|
---|
139 | //EIGEN_MKL_RANKUPDATE_C(scomplex, MKL_Complex8, double, cherk)
|
---|
140 |
|
---|
141 |
|
---|
142 | } // end namespace internal
|
---|
143 |
|
---|
144 | } // end namespace Eigen
|
---|
145 |
|
---|
146 | #endif // EIGEN_GENERAL_MATRIX_MATRIX_TRIANGULAR_MKL_H
|
---|