TR-mbed 1.0
Loading...
Searching...
No Matches
GeneralProduct.h
Go to the documentation of this file.
1// This file is part of Eigen, a lightweight C++ template library
2// for linear algebra.
3//
4// Copyright (C) 2006-2008 Benoit Jacob <jacob.benoit.1@gmail.com>
5// Copyright (C) 2008-2011 Gael Guennebaud <gael.guennebaud@inria.fr>
6//
7// This Source Code Form is subject to the terms of the Mozilla
8// Public License v. 2.0. If a copy of the MPL was not distributed
9// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
10
11#ifndef EIGEN_GENERAL_PRODUCT_H
12#define EIGEN_GENERAL_PRODUCT_H
13
14namespace Eigen {
15
16enum {
17 Large = 2,
18 Small = 3
19};
20
21// Define the threshold value to fallback from the generic matrix-matrix product
22// implementation (heavy) to the lightweight coeff-based product one.
23// See generic_product_impl<Lhs,Rhs,DenseShape,DenseShape,GemmProduct>
24// in products/GeneralMatrixMatrix.h for more details.
25// TODO This threshold should also be used in the compile-time selector below.
26#ifndef EIGEN_GEMM_TO_COEFFBASED_THRESHOLD
27// This default value has been obtained on a Haswell architecture.
28#define EIGEN_GEMM_TO_COEFFBASED_THRESHOLD 20
29#endif
30
31namespace internal {
32
33template<int Rows, int Cols, int Depth> struct product_type_selector;
34
35template<int Size, int MaxSize> struct product_size_category
36{
37 enum {
38 #ifndef EIGEN_GPU_COMPILE_PHASE
39 is_large = MaxSize == Dynamic ||
42 #else
43 is_large = 0,
44 #endif
45 value = is_large ? Large
46 : Size == 1 ? 1
47 : Small
48 };
49};
50
51template<typename Lhs, typename Rhs> struct product_type
52{
53 typedef typename remove_all<Lhs>::type _Lhs;
54 typedef typename remove_all<Rhs>::type _Rhs;
55 enum {
64 };
65
66 // the splitting into different lines of code here, introducing the _select enums and the typedef below,
67 // is to work around an internal compiler error with gcc 4.1 and 4.2.
68private:
69 enum {
73 };
74 typedef product_type_selector<rows_select, cols_select, depth_select> selector;
75
76public:
77 enum {
78 value = selector::ret,
79 ret = selector::ret
80 };
81#ifdef EIGEN_DEBUG_PRODUCT
82 static void debug()
83 {
87 EIGEN_DEBUG_VAR(rows_select);
88 EIGEN_DEBUG_VAR(cols_select);
89 EIGEN_DEBUG_VAR(depth_select);
91 }
92#endif
93};
94
95/* The following allows to select the kind of product at compile time
96 * based on the three dimensions of the product.
97 * This is a compile time mapping from {1,Small,Large}^3 -> {product types} */
98// FIXME I'm not sure the current mapping is the ideal one.
99template<int M, int N> struct product_type_selector<M,N,1> { enum { ret = OuterProduct }; };
100template<int M> struct product_type_selector<M, 1, 1> { enum { ret = LazyCoeffBasedProductMode }; };
101template<int N> struct product_type_selector<1, N, 1> { enum { ret = LazyCoeffBasedProductMode }; };
102template<int Depth> struct product_type_selector<1, 1, Depth> { enum { ret = InnerProduct }; };
103template<> struct product_type_selector<1, 1, 1> { enum { ret = InnerProduct }; };
104template<> struct product_type_selector<Small,1, Small> { enum { ret = CoeffBasedProductMode }; };
105template<> struct product_type_selector<1, Small,Small> { enum { ret = CoeffBasedProductMode }; };
107template<> struct product_type_selector<Small, Small, 1> { enum { ret = LazyCoeffBasedProductMode }; };
108template<> struct product_type_selector<Small, Large, 1> { enum { ret = LazyCoeffBasedProductMode }; };
109template<> struct product_type_selector<Large, Small, 1> { enum { ret = LazyCoeffBasedProductMode }; };
110template<> struct product_type_selector<1, Large,Small> { enum { ret = CoeffBasedProductMode }; };
111template<> struct product_type_selector<1, Large,Large> { enum { ret = GemvProduct }; };
112template<> struct product_type_selector<1, Small,Large> { enum { ret = CoeffBasedProductMode }; };
113template<> struct product_type_selector<Large,1, Small> { enum { ret = CoeffBasedProductMode }; };
114template<> struct product_type_selector<Large,1, Large> { enum { ret = GemvProduct }; };
115template<> struct product_type_selector<Small,1, Large> { enum { ret = CoeffBasedProductMode }; };
116template<> struct product_type_selector<Small,Small,Large> { enum { ret = GemmProduct }; };
117template<> struct product_type_selector<Large,Small,Large> { enum { ret = GemmProduct }; };
118template<> struct product_type_selector<Small,Large,Large> { enum { ret = GemmProduct }; };
119template<> struct product_type_selector<Large,Large,Large> { enum { ret = GemmProduct }; };
122template<> struct product_type_selector<Large,Large,Small> { enum { ret = GemmProduct }; };
123
124} // end namespace internal
125
126/***********************************************************************
127* Implementation of Inner Vector Vector Product
128***********************************************************************/
129
130// FIXME : maybe the "inner product" could return a Scalar
131// instead of a 1x1 matrix ??
132// Pro: more natural for the user
133// Cons: this could be a problem if in a meta unrolled algorithm a matrix-matrix
134// product ends up to a row-vector times col-vector product... To tackle this use
135// case, we could have a specialization for Block<MatrixType,1,1> with: operator=(Scalar x);
136
137/***********************************************************************
138* Implementation of Outer Vector Vector Product
139***********************************************************************/
140
141/***********************************************************************
142* Implementation of General Matrix Vector Product
143***********************************************************************/
144
145/* According to the shape/flags of the matrix we have to distinghish 3 different cases:
146 * 1 - the matrix is col-major, BLAS compatible and M is large => call fast BLAS-like colmajor routine
147 * 2 - the matrix is row-major, BLAS compatible and N is large => call fast BLAS-like rowmajor routine
148 * 3 - all other cases are handled using a simple loop along the outer-storage direction.
149 * Therefore we need a lower level meta selector.
150 * Furthermore, if the matrix is the rhs, then the product has to be transposed.
151 */
152namespace internal {
153
154template<int Side, int StorageOrder, bool BlasCompatible>
156
157} // end namespace internal
158
159namespace internal {
160
161template<typename Scalar,int Size,int MaxSize,bool Cond> struct gemv_static_vector_if;
162
163template<typename Scalar,int Size,int MaxSize>
165{
166 EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC Scalar* data() { eigen_internal_assert(false && "should never be called"); return 0; }
167};
168
169template<typename Scalar,int Size>
174
175template<typename Scalar,int Size,int MaxSize>
177{
178 enum {
181 };
182 #if EIGEN_MAX_STATIC_ALIGN_BYTES!=0
184 EIGEN_STRONG_INLINE Scalar* data() { return m_data.array; }
185 #else
186 // Some architectures cannot align on the stack,
187 // => let's manually enforce alignment by allocating more data and return the address of the first aligned element.
190 return ForceAlignment
191 ? reinterpret_cast<Scalar*>((internal::UIntPtr(m_data.array) & ~(std::size_t(EIGEN_MAX_ALIGN_BYTES-1))) + EIGEN_MAX_ALIGN_BYTES)
192 : m_data.array;
193 }
194 #endif
195};
196
197// The vector is on the left => transposition
198template<int StorageOrder, bool BlasCompatible>
200{
201 template<typename Lhs, typename Rhs, typename Dest>
202 static void run(const Lhs &lhs, const Rhs &rhs, Dest& dest, const typename Dest::Scalar& alpha)
203 {
205 enum { OtherStorageOrder = StorageOrder == RowMajor ? ColMajor : RowMajor };
207 ::run(rhs.transpose(), lhs.transpose(), destT, alpha);
208 }
209};
210
212{
213 template<typename Lhs, typename Rhs, typename Dest>
214 static inline void run(const Lhs &lhs, const Rhs &rhs, Dest& dest, const typename Dest::Scalar& alpha)
215 {
216 typedef typename Lhs::Scalar LhsScalar;
217 typedef typename Rhs::Scalar RhsScalar;
218 typedef typename Dest::Scalar ResScalar;
219 typedef typename Dest::RealScalar RealScalar;
220
221 typedef internal::blas_traits<Lhs> LhsBlasTraits;
222 typedef typename LhsBlasTraits::DirectLinearAccessType ActualLhsType;
223 typedef internal::blas_traits<Rhs> RhsBlasTraits;
224 typedef typename RhsBlasTraits::DirectLinearAccessType ActualRhsType;
225
227
228 ActualLhsType actualLhs = LhsBlasTraits::extract(lhs);
229 ActualRhsType actualRhs = RhsBlasTraits::extract(rhs);
230
231 ResScalar actualAlpha = combine_scalar_factors(alpha, lhs, rhs);
232
233 // make sure Dest is a compile-time vector type (bug 1166)
235
236 enum {
237 // FIXME find a way to allow an inner stride on the result if packet_traits<Scalar>::size==1
238 // on, the other hand it is good for the cache to pack the vector anyways...
239 EvalToDestAtCompileTime = (ActualDest::InnerStrideAtCompileTime==1),
241 MightCannotUseDest = ((!EvalToDestAtCompileTime) || ComplexByReal) && (ActualDest::MaxSizeAtCompileTime!=0)
242 };
243
247
249 {
250 // shortcut if we are sure to be able to use dest directly,
251 // this ease the compiler to generate cleaner and more optimzized code for most common cases
253 <Index,LhsScalar,LhsMapper,ColMajor,LhsBlasTraits::NeedToConjugate,RhsScalar,RhsMapper,RhsBlasTraits::NeedToConjugate>::run(
254 actualLhs.rows(), actualLhs.cols(),
255 LhsMapper(actualLhs.data(), actualLhs.outerStride()),
256 RhsMapper(actualRhs.data(), actualRhs.innerStride()),
257 dest.data(), 1,
259 }
260 else
261 {
263
264 const bool alphaIsCompatible = (!ComplexByReal) || (numext::imag(actualAlpha)==RealScalar(0));
266
268 evalToDest ? dest.data() : static_dest.data());
269
270 if(!evalToDest)
271 {
272 #ifdef EIGEN_DENSE_STORAGE_CTOR_PLUGIN
273 Index size = dest.size();
275 #endif
277 {
278 MappedDest(actualDestPtr, dest.size()).setZero();
279 compatibleAlpha = RhsScalar(1);
280 }
281 else
283 }
284
286 <Index,LhsScalar,LhsMapper,ColMajor,LhsBlasTraits::NeedToConjugate,RhsScalar,RhsMapper,RhsBlasTraits::NeedToConjugate>::run(
287 actualLhs.rows(), actualLhs.cols(),
288 LhsMapper(actualLhs.data(), actualLhs.outerStride()),
289 RhsMapper(actualRhs.data(), actualRhs.innerStride()),
290 actualDestPtr, 1,
292
293 if (!evalToDest)
294 {
296 dest.matrix() += actualAlpha * MappedDest(actualDestPtr, dest.size());
297 else
299 }
300 }
301 }
302};
303
305{
306 template<typename Lhs, typename Rhs, typename Dest>
307 static void run(const Lhs &lhs, const Rhs &rhs, Dest& dest, const typename Dest::Scalar& alpha)
308 {
309 typedef typename Lhs::Scalar LhsScalar;
310 typedef typename Rhs::Scalar RhsScalar;
311 typedef typename Dest::Scalar ResScalar;
312
313 typedef internal::blas_traits<Lhs> LhsBlasTraits;
314 typedef typename LhsBlasTraits::DirectLinearAccessType ActualLhsType;
315 typedef internal::blas_traits<Rhs> RhsBlasTraits;
316 typedef typename RhsBlasTraits::DirectLinearAccessType ActualRhsType;
317 typedef typename internal::remove_all<ActualRhsType>::type ActualRhsTypeCleaned;
318
319 typename add_const<ActualLhsType>::type actualLhs = LhsBlasTraits::extract(lhs);
320 typename add_const<ActualRhsType>::type actualRhs = RhsBlasTraits::extract(rhs);
321
322 ResScalar actualAlpha = combine_scalar_factors(alpha, lhs, rhs);
323
324 enum {
325 // FIXME find a way to allow an inner stride on the result if packet_traits<Scalar>::size==1
326 // on, the other hand it is good for the cache to pack the vector anyways...
327 DirectlyUseRhs = ActualRhsTypeCleaned::InnerStrideAtCompileTime==1 || ActualRhsTypeCleaned::MaxSizeAtCompileTime==0
328 };
329
331
333 DirectlyUseRhs ? const_cast<RhsScalar*>(actualRhs.data()) : static_rhs.data());
334
335 if(!DirectlyUseRhs)
336 {
337 #ifdef EIGEN_DENSE_STORAGE_CTOR_PLUGIN
338 Index size = actualRhs.size();
340 #endif
342 }
343
347 <Index,LhsScalar,LhsMapper,RowMajor,LhsBlasTraits::NeedToConjugate,RhsScalar,RhsMapper,RhsBlasTraits::NeedToConjugate>::run(
348 actualLhs.rows(), actualLhs.cols(),
349 LhsMapper(actualLhs.data(), actualLhs.outerStride()),
351 dest.data(), dest.col(0).innerStride(), //NOTE if dest is not a vector at compile-time, then dest.innerStride() might be wrong. (bug 1166)
353 }
354};
355
357{
358 template<typename Lhs, typename Rhs, typename Dest>
359 static void run(const Lhs &lhs, const Rhs &rhs, Dest& dest, const typename Dest::Scalar& alpha)
360 {
361 EIGEN_STATIC_ASSERT((!nested_eval<Lhs,1>::Evaluate),EIGEN_INTERNAL_COMPILATION_ERROR_OR_YOU_MADE_A_PROGRAMMING_MISTAKE);
362 // TODO if rhs is large enough it might be beneficial to make sure that dest is sequentially stored in memory, otherwise use a temp
364 const Index size = rhs.rows();
365 for(Index k=0; k<size; ++k)
366 dest += (alpha*actual_rhs.coeff(k)) * lhs.col(k);
367 }
368};
369
371{
372 template<typename Lhs, typename Rhs, typename Dest>
373 static void run(const Lhs &lhs, const Rhs &rhs, Dest& dest, const typename Dest::Scalar& alpha)
374 {
375 EIGEN_STATIC_ASSERT((!nested_eval<Lhs,1>::Evaluate),EIGEN_INTERNAL_COMPILATION_ERROR_OR_YOU_MADE_A_PROGRAMMING_MISTAKE);
377 const Index rows = dest.rows();
378 for(Index i=0; i<rows; ++i)
379 dest.coeffRef(i) += alpha * (lhs.row(i).cwiseProduct(actual_rhs.transpose())).sum();
380 }
381};
382
383} // end namespace internal
384
385/***************************************************************************
386* Implementation of matrix base methods
387***************************************************************************/
388
395template<typename Derived>
396template<typename OtherDerived>
398const Product<Derived, OtherDerived>
400{
401 // A note regarding the function declaration: In MSVC, this function will sometimes
402 // not be inlined since DenseStorage is an unwindable object for dynamic
403 // matrices and product types are holding a member to store the result.
404 // Thus it does not help tagging this function with EIGEN_STRONG_INLINE.
405 enum {
406 ProductIsValid = Derived::ColsAtCompileTime==Dynamic
407 || OtherDerived::RowsAtCompileTime==Dynamic
408 || int(Derived::ColsAtCompileTime)==int(OtherDerived::RowsAtCompileTime),
409 AreVectors = Derived::IsVectorAtCompileTime && OtherDerived::IsVectorAtCompileTime,
410 SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived,OtherDerived)
411 };
412 // note to the lost user:
413 // * for a dot product use: v1.dot(v2)
414 // * for a coeff-wise product use: v1.cwiseProduct(v2)
415 EIGEN_STATIC_ASSERT(ProductIsValid || !(AreVectors && SameSizes),
416 INVALID_VECTOR_VECTOR_PRODUCT__IF_YOU_WANTED_A_DOT_OR_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTIONS)
417 EIGEN_STATIC_ASSERT(ProductIsValid || !(SameSizes && !AreVectors),
418 INVALID_MATRIX_PRODUCT__IF_YOU_WANTED_A_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTION)
419 EIGEN_STATIC_ASSERT(ProductIsValid || SameSizes, INVALID_MATRIX_PRODUCT)
420#ifdef EIGEN_DEBUG_PRODUCT
422#endif
423
424 return Product<Derived, OtherDerived>(derived(), other.derived());
425}
426
438template<typename Derived>
439template<typename OtherDerived>
443{
444 enum {
445 ProductIsValid = Derived::ColsAtCompileTime==Dynamic
446 || OtherDerived::RowsAtCompileTime==Dynamic
447 || int(Derived::ColsAtCompileTime)==int(OtherDerived::RowsAtCompileTime),
448 AreVectors = Derived::IsVectorAtCompileTime && OtherDerived::IsVectorAtCompileTime,
449 SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived,OtherDerived)
450 };
451 // note to the lost user:
452 // * for a dot product use: v1.dot(v2)
453 // * for a coeff-wise product use: v1.cwiseProduct(v2)
454 EIGEN_STATIC_ASSERT(ProductIsValid || !(AreVectors && SameSizes),
455 INVALID_VECTOR_VECTOR_PRODUCT__IF_YOU_WANTED_A_DOT_OR_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTIONS)
456 EIGEN_STATIC_ASSERT(ProductIsValid || !(SameSizes && !AreVectors),
457 INVALID_MATRIX_PRODUCT__IF_YOU_WANTED_A_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTION)
458 EIGEN_STATIC_ASSERT(ProductIsValid || SameSizes, INVALID_MATRIX_PRODUCT)
459
460 return Product<Derived,OtherDerived,LazyProduct>(derived(), other.derived());
461}
462
463} // end namespace Eigen
464
465#endif // EIGEN_PRODUCT_H
#define EIGEN_CACHEFRIENDLY_PRODUCT_THRESHOLD
Definition PacketMath.h:18
int i
Definition BiCGSTAB_step_by_step.cpp:9
#define EIGEN_MAX_ALIGN_BYTES
Definition ConfigureVectorization.h:175
#define EIGEN_PLAIN_ENUM_MIN(a, b)
Definition Macros.h:1288
#define eigen_internal_assert(x)
Definition Macros.h:1043
#define EIGEN_DEBUG_VAR(x)
Definition Macros.h:898
#define EIGEN_DEVICE_FUNC
Definition Macros.h:976
#define EIGEN_STRONG_INLINE
Definition Macros.h:917
#define EIGEN_SIZE_MIN_PREFER_FIXED(a, b)
Definition Macros.h:1302
int data[]
Definition Map_placement_new.cpp:1
#define ei_declare_aligned_stack_constructed_variable(TYPE, NAME, SIZE, BUFFER)
Definition Memory.h:768
#define EIGEN_PREDICATE_SAME_MATRIX_SIZE(TYPE0, TYPE1)
Definition StaticAssert.h:174
#define EIGEN_STATIC_ASSERT(CONDITION, MSG)
Definition StaticAssert.h:127
int rows
Definition Tutorial_commainit_02.cpp:1
Scalar Scalar int size
Definition benchVecAdd.cpp:17
SCALAR Scalar
Definition bench_gemm.cpp:46
NumTraits< Scalar >::Real RealScalar
Definition bench_gemm.cpp:47
Base class for all dense matrices, vectors, and expressions.
Definition MatrixBase.h:50
EIGEN_DEVICE_FUNC const Product< Derived, OtherDerived > operator*(const MatrixBase< OtherDerived > &other) const
EIGEN_DEVICE_FUNC const Product< Derived, OtherDerived, LazyProduct > lazyProduct(const MatrixBase< OtherDerived > &other) const
The matrix class, also used for vectors and row-vectors.
Definition Matrix.h:180
Expression of the product of two arbitrary matrices or vectors.
Definition Product.h:75
@ N
Definition constructor.cpp:23
@ AlignedMax
Definition Constants.h:252
@ ColMajor
Definition Constants.h:319
@ RowMajor
Definition Constants.h:321
@ OnTheLeft
Definition Constants.h:332
@ OnTheRight
Definition Constants.h:334
return int(ret)+1
RealScalar alpha
Definition level1_cplx_impl.h:147
DenseIndex ret
Definition level1_cplx_impl.h:44
std::size_t UIntPtr
Definition Meta.h:92
EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE ResScalar combine_scalar_factors(const ResScalar &alpha, const Lhs &lhs, const Rhs &rhs)
Definition BlasUtil.h:568
@ Lhs
Definition TensorContractionMapper.h:19
@ Rhs
Definition TensorContractionMapper.h:18
Namespace containing all symbols from the Eigen library.
Definition bench_norm.cpp:85
@ GemvProduct
Definition Constants.h:500
@ InnerProduct
Definition Constants.h:500
@ CoeffBasedProductMode
Definition Constants.h:500
@ OuterProduct
Definition Constants.h:500
@ GemmProduct
Definition Constants.h:500
@ LazyCoeffBasedProductMode
Definition Constants.h:500
EIGEN_DEFAULT_DENSE_INDEX_TYPE Index
The Index type as used for the API.
Definition Meta.h:74
const int Dynamic
Definition Constants.h:22
@ Small
Definition GeneralProduct.h:18
@ Large
Definition GeneralProduct.h:17
Definition BandTriangularSolver.h:13
Holds information about the various numeric (i.e. scalar) types allowed by Eigen.
Definition NumTraits.h:233
static void run(const Lhs &lhs, const Rhs &rhs, Dest &dest, const typename Dest::Scalar &alpha)
Definition GeneralProduct.h:202
static void run(const Lhs &lhs, const Rhs &rhs, Dest &dest, const typename Dest::Scalar &alpha)
Definition GeneralProduct.h:359
static void run(const Lhs &lhs, const Rhs &rhs, Dest &dest, const typename Dest::Scalar &alpha)
Definition GeneralProduct.h:214
static void run(const Lhs &lhs, const Rhs &rhs, Dest &dest, const typename Dest::Scalar &alpha)
Definition GeneralProduct.h:373
static void run(const Lhs &lhs, const Rhs &rhs, Dest &dest, const typename Dest::Scalar &alpha)
Definition GeneralProduct.h:307
Definition GeneralProduct.h:155
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC Scalar * data()
Definition GeneralProduct.h:172
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC Scalar * data()
Definition GeneralProduct.h:166
EIGEN_STRONG_INLINE Scalar * data()
Definition GeneralProduct.h:189
Definition GeneralProduct.h:161
static EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE To run(const From &x)
Definition BlasUtil.h:43
Definition XprHelper.h:458
Definition GenericPacketMath.h:107
Definition DenseStorage.h:45
T array[Size]
Definition DenseStorage.h:46
Definition GeneralProduct.h:36
Definition GeneralProduct.h:33
Definition GeneralProduct.h:52
@ MaxDepth
Definition GeneralProduct.h:60
@ Cols
Definition GeneralProduct.h:59
@ MaxRows
Definition GeneralProduct.h:56
@ Depth
Definition GeneralProduct.h:62
@ MaxCols
Definition GeneralProduct.h:58
@ Rows
Definition GeneralProduct.h:57
@ value
Definition GeneralProduct.h:78
@ ret
Definition GeneralProduct.h:79
remove_all< Lhs >::type _Lhs
Definition GeneralProduct.h:53
remove_all< Rhs >::type _Rhs
Definition GeneralProduct.h:54
Definition ForwardDeclarations.h:17