11#ifndef EIGEN_GENERAL_PRODUCT_H
12#define EIGEN_GENERAL_PRODUCT_H
14#include "./InternalHeaderCheck.h"
28#ifndef EIGEN_GEMM_TO_COEFFBASED_THRESHOLD
30#define EIGEN_GEMM_TO_COEFFBASED_THRESHOLD 20
// Forward declaration of the selector that is specialized on three integer
// template parameters, in the order (Rows, Cols, Depth). Each specialization
// exposes the chosen product kind through a nested enumerator named `ret`.
35template<
int Rows,
int Cols,
int Depth>
struct product_type_selector;
// Classifies a single dimension, described by its compile-time Size and
// MaxSize, into a size category exposed as `value`.
// NOTE(review): the opening brace / `enum {` line and the closing lines of this
// struct are not visible in this listing.
37template<
int Size,
int MaxSize>
struct product_size_category
// When EIGEN_GPU_COMPILE_PHASE is not defined, `is_large` holds if any of:
//   - MaxSize is Dynamic,
//   - Size reaches EIGEN_CACHEFRIENDLY_PRODUCT_THRESHOLD,
//   - Size is Dynamic and MaxSize reaches that same threshold.
// NOTE(review): the alternative branch of this #ifndef is not visible here.
40 #ifndef EIGEN_GPU_COMPILE_PHASE
41 is_large = MaxSize ==
Dynamic ||
42 Size >= EIGEN_CACHEFRIENDLY_PRODUCT_THRESHOLD ||
43 (Size==
Dynamic && MaxSize>=EIGEN_CACHEFRIENDLY_PRODUCT_THRESHOLD),
// `value` is Large when is_large holds; the remaining alternatives of this
// conditional expression are cut off in this listing.
47 value = is_large ? Large
// Determines, at compile time, which kind of product implementation applies to
// the operand types Lhs and Rhs. The result is exposed as `value`.
// NOTE(review): braces, `enum {` openers and the header of the debug function
// are not visible in this listing.
53template<
typename Lhs,
typename Rhs>
struct product_type
// Operand types with all qualifiers/references removed via remove_all.
55 typedef typename remove_all<Lhs>::type _Lhs;
56 typedef typename remove_all<Rhs>::type _Rhs;
// Result rows come from the left operand, result columns from the right one.
58 MaxRows = traits<_Lhs>::MaxRowsAtCompileTime,
59 Rows = traits<_Lhs>::RowsAtCompileTime,
60 MaxCols = traits<_Rhs>::MaxColsAtCompileTime,
61 Cols = traits<_Rhs>::ColsAtCompileTime,
// The depth is shared by both operands (columns of Lhs, rows of Rhs); the two
// compile-time values are combined with min_size_prefer_fixed.
62 MaxDepth = min_size_prefer_fixed(traits<_Lhs>::MaxColsAtCompileTime,
63 traits<_Rhs>::MaxRowsAtCompileTime),
64 Depth = min_size_prefer_fixed(traits<_Lhs>::ColsAtCompileTime,
65 traits<_Rhs>::RowsAtCompileTime)
// Each of the three dimensions is reduced to a size category.
72 rows_select = product_size_category<Rows,MaxRows>::value,
73 cols_select = product_size_category<Cols,MaxCols>::value,
74 depth_select = product_size_category<Depth,MaxDepth>::value
// The category triple picks a product_type_selector specialization, whose
// `ret` enumerator becomes this struct's `value`.
76 typedef product_type_selector<rows_select, cols_select, depth_select> selector;
80 value = selector::ret,
// Only when EIGEN_DEBUG_PRODUCT is defined: dump the intermediate values
// through EIGEN_DEBUG_VAR.
83#ifdef EIGEN_DEBUG_PRODUCT
86 EIGEN_DEBUG_VAR(Rows);
87 EIGEN_DEBUG_VAR(Cols);
88 EIGEN_DEBUG_VAR(Depth);
89 EIGEN_DEBUG_VAR(rows_select);
90 EIGEN_DEBUG_VAR(cols_select);
91 EIGEN_DEBUG_VAR(depth_select);
92 EIGEN_DEBUG_VAR(value);
// Partial specializations of product_type_selector<Rows, Cols, Depth> for the
// cases where at least one dimension is exactly 1. Each one publishes its
// decision as the enumerator `ret`.

// Depth of 1 with arbitrary row/column categories: outer product.
101template<
int M,
int N>
struct product_type_selector<M,N,1> {
enum { ret = OuterProduct }; };
// Depth of 1 and a single column: lazy coefficient-based product.
102template<
int M>
struct product_type_selector<M, 1, 1> {
enum { ret = LazyCoeffBasedProductMode }; };
// Depth of 1 and a single row: lazy coefficient-based product.
103template<
int N>
struct product_type_selector<1, N, 1> {
enum { ret = LazyCoeffBasedProductMode }; };
// Single row and single column with any depth category: inner product.
104template<
int Depth>
struct product_type_selector<1, 1, Depth> {
enum { ret = InnerProduct }; };
// Explicit full specialization for <1,1,1>, which also yields an inner product.
105template<>
struct product_type_selector<1, 1, 1> {
enum { ret = InnerProduct }; };
// Full specializations of product_type_selector<Rows, Cols, Depth> over the
// Small / Large / 1 size categories. Argument order is (Rows, Cols, Depth) and
// each specialization publishes its decision as the enumerator `ret`.

// All non-unit dimensions Small: coefficient-based product.
106template<>
struct product_type_selector<Small,1, Small> {
enum { ret = CoeffBasedProductMode }; };
107template<>
struct product_type_selector<1, Small,Small> {
enum { ret = CoeffBasedProductMode }; };
108template<>
struct product_type_selector<Small,Small,Small> {
enum { ret = CoeffBasedProductMode }; };
// Depth of 1 with explicit Small/Large row and column categories: lazy
// coefficient-based product.
109template<>
struct product_type_selector<Small, Small, 1> {
enum { ret = LazyCoeffBasedProductMode }; };
110template<>
struct product_type_selector<Small, Large, 1> {
enum { ret = LazyCoeffBasedProductMode }; };
111template<>
struct product_type_selector<Large, Small, 1> {
enum { ret = LazyCoeffBasedProductMode }; };
// Single row: GemvProduct only when both Cols and Depth are Large.
112template<>
struct product_type_selector<1, Large,Small> {
enum { ret = CoeffBasedProductMode }; };
113template<>
struct product_type_selector<1, Large,Large> {
enum { ret = GemvProduct }; };
114template<>
struct product_type_selector<1, Small,Large> {
enum { ret = CoeffBasedProductMode }; };
// Single column: GemvProduct only when both Rows and Depth are Large.
115template<>
struct product_type_selector<Large,1, Small> {
enum { ret = CoeffBasedProductMode }; };
116template<>
struct product_type_selector<Large,1, Large> {
enum { ret = GemvProduct }; };
117template<>
struct product_type_selector<Small,1, Large> {
enum { ret = CoeffBasedProductMode }; };
// No unit dimension and a Large depth: always GemmProduct.
118template<>
struct product_type_selector<Small,Small,Large> {
enum { ret = GemmProduct }; };
119template<>
struct product_type_selector<Large,Small,Large> {
enum { ret = GemmProduct }; };
120template<>
struct product_type_selector<Small,Large,Large> {
enum { ret = GemmProduct }; };
121template<>
struct product_type_selector<Large,Large,Large> {
enum { ret = GemmProduct }; };
// No unit dimension and a Small depth: GemmProduct only when both Rows and
// Cols are Large, coefficient-based otherwise.
122template<>
struct product_type_selector<Large,Small,Small> {
enum { ret = CoeffBasedProductMode }; };
123template<>
struct product_type_selector<Small,Large,Small> {
enum { ret = CoeffBasedProductMode }; };
124template<>
struct product_type_selector<Large,Large,Small> {
enum { ret = GemmProduct }; };
// Forward declaration of the matrix-vector product dispatcher, specialized on
// three template parameters: the first int parameter, StorageOrder and
// BlasCompatible.
// NOTE(review): the first parameter's identifier is split across two lines in
// this listing ("S" + "ide").
156template<
int S
ide,
int StorageOrder,
bool BlasCompatible>
157struct gemv_dense_selector;
// Forward declaration of a helper that provides a Scalar* through data();
// the boolean Cond selects between the specializations of this template.
163template<
typename Scalar,
int Size,
int MaxSize,
bool Cond>
struct gemv_static_vector_if;
// Specialization for Cond == false: no storage is declared in the visible
// lines. data() fires an internal assertion ("should never be called") and
// returns 0.
// NOTE(review): the struct's braces are not visible in this listing.
165template<
typename Scalar,
int Size,
int MaxSize>
166struct gemv_static_vector_if<Scalar,Size,MaxSize,false>
168 EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC
Scalar* data() { eigen_internal_assert(
false &&
"should never be called");
return 0; }
// Specialization for Cond == true with MaxSize == Dynamic: data() returns 0
// without asserting.
// NOTE(review): presumably a 0 result tells the caller to obtain the buffer
// some other way; confirm against ei_declare_aligned_stack_constructed_variable.
171template<
typename Scalar,
int Size>
172struct gemv_static_vector_if<Scalar,Size,
Dynamic,true>
174 EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC
Scalar* data() {
return 0; }
// Specialization for Cond == true with a non-Dynamic MaxSize: owns a
// plain_array member `m_data` and returns a pointer into it from data().
// NOTE(review): braces, the `enum {` opener, and the #else / #endif lines
// separating the two variants below are not visible in this listing.
177template<
typename Scalar,
int Size,
int MaxSize>
178struct gemv_static_vector_if<Scalar,Size,MaxSize,true>
// ForceAlignment follows packet_traits<Scalar>::Vectorizable; PacketSize is
// the packet size reported by the same traits.
181 ForceAlignment = internal::packet_traits<Scalar>::Vectorizable,
182 PacketSize = internal::packet_traits<Scalar>::size
// Variant used when EIGEN_MAX_STATIC_ALIGN_BYTES is non-zero: the array gets an
// alignment argument of plain_enum_min(AlignedMax, PacketSize) and data()
// returns the array start directly.
184 #if EIGEN_MAX_STATIC_ALIGN_BYTES!=0
185 internal::plain_array<Scalar, internal::min_size_prefer_fixed(Size, MaxSize), 0,
186 internal::plain_enum_min(AlignedMax, PacketSize)> m_data;
187 EIGEN_STRONG_INLINE Scalar* data() {
return m_data.array; }
// Second variant: when ForceAlignment is set, the array size argument is
// enlarged by EIGEN_MAX_ALIGN_BYTES and data() clears the low address bits and
// adds EIGEN_MAX_ALIGN_BYTES, yielding an address inside the enlarged array.
// NOTE(review): the mask assumes EIGEN_MAX_ALIGN_BYTES is a power of two; the
// non-ForceAlignment branch of the conditional is cut off here.
191 internal::plain_array<Scalar, internal::min_size_prefer_fixed(Size, MaxSize)+(ForceAlignment?EIGEN_MAX_ALIGN_BYTES:0),0> m_data;
192 EIGEN_STRONG_INLINE Scalar* data() {
193 return ForceAlignment
194 ?
reinterpret_cast<Scalar*
>((internal::UIntPtr(m_data.array) & ~(std::size_t(EIGEN_MAX_ALIGN_BYTES-1))) + EIGEN_MAX_ALIGN_BYTES)
// OnTheLeft specialization: reduces the problem to the OnTheRight case by
// transposing everything. The destination is wrapped in a Transpose
// expression, and the operands are swapped and transposed before forwarding.
// NOTE(review): the definition of OtherStorageOrder and the struct/function
// braces are not visible in this listing.
201template<
int StorageOrder,
bool BlasCompatible>
202struct gemv_dense_selector<
OnTheLeft,StorageOrder,BlasCompatible>
// lhs, rhs: product operands; dest: destination expression; alpha: scalar
// factor, forwarded unchanged.
204 template<
typename Lhs,
typename Rhs,
typename Dest>
205 static void run(
const Lhs &lhs,
const Rhs &rhs, Dest& dest,
const typename Dest::Scalar& alpha)
207 Transpose<Dest> destT(dest);
209 gemv_dense_selector<OnTheRight,OtherStorageOrder,BlasCompatible>
210 ::run(rhs.transpose(), lhs.transpose(), destT, alpha);
// Matrix-vector product through general_matrix_vector_product with a ColMajor
// left-hand side, run either on `dest` directly or on a temporary buffer.
// NOTE(review): the enclosing struct header is not visible in this listing;
// presumably the column-major, BLAS-compatible gemv_dense_selector
// specialization -- confirm. Braces, `else` lines and the trailing arguments
// of both kernel calls are also missing.
// lhs, rhs: product operands; dest: destination vector; alpha: scalar factor.
216 template<
typename Lhs,
typename Rhs,
typename Dest>
217 static inline void run(
const Lhs &lhs,
const Rhs &rhs, Dest& dest,
const typename Dest::Scalar& alpha)
219 typedef typename Lhs::Scalar LhsScalar;
220 typedef typename Rhs::Scalar RhsScalar;
221 typedef typename Dest::Scalar ResScalar;
222 typedef typename Dest::RealScalar RealScalar;
224 typedef internal::blas_traits<Lhs> LhsBlasTraits;
225 typedef typename LhsBlasTraits::DirectLinearAccessType ActualLhsType;
226 typedef internal::blas_traits<Rhs> RhsBlasTraits;
227 typedef typename RhsBlasTraits::DirectLinearAccessType ActualRhsType;
// Dynamic-size column vector view used to read/write the temporary buffer.
229 typedef Map<Matrix<ResScalar,Dynamic,1>, plain_enum_min(AlignedMax, internal::packet_traits<ResScalar>::size)> MappedDest;
// Extract the underlying operands through blas_traits and fold alpha together
// with lhs and rhs into one factor via combine_scalar_factors.
231 ActualLhsType actualLhs = LhsBlasTraits::extract(lhs);
232 ActualRhsType actualRhs = RhsBlasTraits::extract(rhs);
234 ResScalar actualAlpha = combine_scalar_factors(alpha, lhs, rhs);
// Use Dest itself when it is a compile-time vector, otherwise its column type.
237 typedef typename conditional<Dest::IsVectorAtCompileTime, Dest, typename Dest::ColXpr>::type ActualDest;
// EvalToDestAtCompileTime: destination has unit inner stride.
// ComplexByReal: complex Lhs scalar combined with a non-complex Rhs scalar.
// MightCannotUseDest: either condition may prevent writing to dest directly,
// unless the destination has a maximum size of 0.
242 EvalToDestAtCompileTime = (ActualDest::InnerStrideAtCompileTime==1),
243 ComplexByReal = (NumTraits<LhsScalar>::IsComplex) && (!NumTraits<RhsScalar>::IsComplex),
244 MightCannotUseDest = ((!EvalToDestAtCompileTime) || ComplexByReal) && (ActualDest::MaxSizeAtCompileTime!=0)
247 typedef const_blas_data_mapper<LhsScalar,Index,ColMajor> LhsMapper;
248 typedef const_blas_data_mapper<RhsScalar,Index,RowMajor> RhsMapper;
// The kernel takes its factor as an RhsScalar; convert actualAlpha accordingly.
249 RhsScalar compatibleAlpha = get_factor<ResScalar,RhsScalar>::run(actualAlpha);
// Path taken when the compile-time flags allow using dest without a temporary.
251 if(!MightCannotUseDest)
255 general_matrix_vector_product
256 <
Index,LhsScalar,LhsMapper,
ColMajor,LhsBlasTraits::NeedToConjugate,RhsScalar,RhsMapper,RhsBlasTraits::NeedToConjugate>::run(
257 actualLhs.rows(), actualLhs.cols(),
258 LhsMapper(actualLhs.data(), actualLhs.outerStride()),
259 RhsMapper(actualRhs.data(), actualRhs.innerStride()),
// General path: a temporary destination may be required.
265 gemv_static_vector_if<ResScalar,ActualDest::SizeAtCompileTime,ActualDest::MaxSizeAtCompileTime,MightCannotUseDest> static_dest;
// alpha is compatible unless ComplexByReal holds and actualAlpha has a
// non-zero imaginary part.
267 const bool alphaIsCompatible = (!ComplexByReal) || (numext::imag(actualAlpha)==RealScalar(0));
268 const bool evalToDest = EvalToDestAtCompileTime && alphaIsCompatible;
// actualDestPtr refers to dest's own data when evalToDest holds, otherwise it
// is seeded with static_dest's buffer.
270 ei_declare_aligned_stack_constructed_variable(ResScalar,actualDestPtr,dest.size(),
271 evalToDest ? dest.data() : static_dest.data());
// NOTE(review): the guard around the statements below is not visible here;
// presumably they only run when evalToDest is false -- confirm.
275 #ifdef EIGEN_DENSE_STORAGE_CTOR_PLUGIN
276 Index size = dest.size();
277 EIGEN_DENSE_STORAGE_CTOR_PLUGIN
// Incompatible alpha: start from a zeroed buffer and run the kernel with a
// factor of 1. Otherwise the buffer is initialized with dest's current values.
279 if(!alphaIsCompatible)
281 MappedDest(actualDestPtr, dest.size()).setZero();
282 compatibleAlpha = RhsScalar(1);
285 MappedDest(actualDestPtr, dest.size()) = dest;
288 general_matrix_vector_product
289 <
Index,LhsScalar,LhsMapper,
ColMajor,LhsBlasTraits::NeedToConjugate,RhsScalar,RhsMapper,RhsBlasTraits::NeedToConjugate>::run(
290 actualLhs.rows(), actualLhs.cols(),
291 LhsMapper(actualLhs.data(), actualLhs.outerStride()),
292 RhsMapper(actualRhs.data(), actualRhs.innerStride()),
// Transfer the buffer back: scaled by actualAlpha and accumulated when alpha
// was incompatible, plainly assigned otherwise.
298 if(!alphaIsCompatible)
299 dest.matrix() += actualAlpha * MappedDest(actualDestPtr, dest.size());
301 dest = MappedDest(actualDestPtr, dest.size());
// Matrix-vector product through general_matrix_vector_product with a RowMajor
// left-hand side. The right-hand side is read from a unit-stride pointer.
// NOTE(review): the enclosing struct header is not visible in this listing;
// presumably the row-major, BLAS-compatible gemv_dense_selector
// specialization -- confirm. Braces, the `enum {` opener and the final
// argument(s) of the kernel call are also missing.
// lhs, rhs: product operands; dest: destination vector; alpha: scalar factor.
309 template<
typename Lhs,
typename Rhs,
typename Dest>
310 static void run(
const Lhs &lhs,
const Rhs &rhs, Dest& dest,
const typename Dest::Scalar& alpha)
312 typedef typename Lhs::Scalar LhsScalar;
313 typedef typename Rhs::Scalar RhsScalar;
314 typedef typename Dest::Scalar ResScalar;
316 typedef internal::blas_traits<Lhs> LhsBlasTraits;
317 typedef typename LhsBlasTraits::DirectLinearAccessType ActualLhsType;
318 typedef internal::blas_traits<Rhs> RhsBlasTraits;
319 typedef typename RhsBlasTraits::DirectLinearAccessType ActualRhsType;
320 typedef typename internal::remove_all<ActualRhsType>::type ActualRhsTypeCleaned;
// Extract the underlying operands through blas_traits and fold alpha together
// with lhs and rhs into one factor via combine_scalar_factors.
322 typename add_const<ActualLhsType>::type actualLhs = LhsBlasTraits::extract(lhs);
323 typename add_const<ActualRhsType>::type actualRhs = RhsBlasTraits::extract(rhs);
325 ResScalar actualAlpha = combine_scalar_factors(alpha, lhs, rhs);
// The rhs data can be used in place when it has unit inner stride at compile
// time, or when its maximum size is 0.
330 DirectlyUseRhs = ActualRhsTypeCleaned::InnerStrideAtCompileTime==1 || ActualRhsTypeCleaned::MaxSizeAtCompileTime==0
333 gemv_static_vector_if<RhsScalar,ActualRhsTypeCleaned::SizeAtCompileTime,ActualRhsTypeCleaned::MaxSizeAtCompileTime,!DirectlyUseRhs> static_rhs;
// actualRhsPtr refers to the rhs data itself (constness cast away) when
// DirectlyUseRhs holds, otherwise it is seeded with static_rhs's buffer.
335 ei_declare_aligned_stack_constructed_variable(RhsScalar,actualRhsPtr,actualRhs.size(),
336 DirectlyUseRhs ?
const_cast<RhsScalar*
>(actualRhs.data()) : static_rhs.data());
// NOTE(review): the guard around the statements below is not visible here;
// presumably they only run when DirectlyUseRhs is false -- confirm.
340 #ifdef EIGEN_DENSE_STORAGE_CTOR_PLUGIN
341 Index size = actualRhs.size();
342 EIGEN_DENSE_STORAGE_CTOR_PLUGIN
// Copy the rhs coefficients into the buffer behind actualRhsPtr.
344 Map<typename ActualRhsTypeCleaned::PlainObject>(actualRhsPtr, actualRhs.size()) = actualRhs;
347 typedef const_blas_data_mapper<LhsScalar,Index,RowMajor> LhsMapper;
348 typedef const_blas_data_mapper<RhsScalar,Index,ColMajor> RhsMapper;
// The rhs mapper uses a stride of 1; the destination is written through its
// own data pointer with the inner stride of its first column.
349 general_matrix_vector_product
350 <
Index,LhsScalar,LhsMapper,
RowMajor,LhsBlasTraits::NeedToConjugate,RhsScalar,RhsMapper,RhsBlasTraits::NeedToConjugate>::run(
351 actualLhs.rows(), actualLhs.cols(),
352 LhsMapper(actualLhs.data(), actualLhs.outerStride()),
353 RhsMapper(actualRhsPtr, 1),
354 dest.data(), dest.col(0).innerStride(),
// Fallback matrix-vector product written with expression-level operations:
// accumulates into dest one lhs column at a time, each scaled by alpha times
// the matching rhs coefficient.
// NOTE(review): the enclosing struct header is not visible in this listing;
// presumably the column-major, non-BLAS gemv_dense_selector specialization.
// lhs, rhs: product operands; dest: destination vector, updated in place with
// +=; alpha: scalar factor.
361 template<
typename Lhs,
typename Rhs,
typename Dest>
362 static void run(
const Lhs &lhs,
const Rhs &rhs, Dest& dest,
const typename Dest::Scalar& alpha)
// Compile-time check that nested_eval would not evaluate Lhs.
364 EIGEN_STATIC_ASSERT((!nested_eval<Lhs,1>::Evaluate),EIGEN_INTERNAL_COMPILATION_ERROR_OR_YOU_MADE_A_PROGRAMMING_MISTAKE);
// Bind rhs through nested_eval before reading its coefficients in the loop.
366 typename nested_eval<Rhs,1>::type actual_rhs(rhs);
367 const Index size = rhs.rows();
368 for(
Index k=0; k<size; ++k)
369 dest += (alpha*actual_rhs.coeff(k)) * lhs.col(k);
// Fallback matrix-vector product written with expression-level operations:
// for every destination row, adds alpha times the sum of the coefficient-wise
// product of that lhs row with the transposed rhs.
// NOTE(review): the enclosing struct header is not visible in this listing;
// presumably the row-major, non-BLAS gemv_dense_selector specialization.
// lhs, rhs: product operands; dest: destination vector, updated in place with
// +=; alpha: scalar factor.
375 template<
typename Lhs,
typename Rhs,
typename Dest>
376 static void run(
const Lhs &lhs,
const Rhs &rhs, Dest& dest,
const typename Dest::Scalar& alpha)
// Compile-time check that nested_eval would not evaluate Lhs.
378 EIGEN_STATIC_ASSERT((!nested_eval<Lhs,1>::Evaluate),EIGEN_INTERNAL_COMPILATION_ERROR_OR_YOU_MADE_A_PROGRAMMING_MISTAKE);
// Bind rhs through nested_eval, passing the lhs row count as its second
// template argument, since rhs is read once per destination row.
379 typename nested_eval<Rhs,Lhs::RowsAtCompileTime>::type actual_rhs(rhs);
380 const Index rows = dest.rows();
381 for(
Index i=0; i<rows; ++i)
382 dest.coeffRef(i) += alpha * (lhs.row(i).cwiseProduct(actual_rhs.transpose())).sum();
// Member template returning a Product<Derived, OtherDerived> expression after
// validating the operand dimensions at compile time.
// NOTE(review): the declarator line (function name and parameters), the
// `enum {` opener, braces and the return statement are not visible in this
// listing; presumably this is MatrixBase<Derived>::operator* -- confirm.
398template<
typename Derived>
399template<
typename OtherDerived>
400EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
401const Product<Derived, OtherDerived>
// ProductIsValid: the inner dimensions agree, or at least one is Dynamic.
409 ProductIsValid = Derived::ColsAtCompileTime==
Dynamic
410 || OtherDerived::RowsAtCompileTime==
Dynamic
411 || int(Derived::ColsAtCompileTime)==int(OtherDerived::RowsAtCompileTime),
// AreVectors / SameSizes only serve to pick the most helpful error message.
412 AreVectors = Derived::IsVectorAtCompileTime && OtherDerived::IsVectorAtCompileTime,
413 SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived,OtherDerived)
// Invalid product of two same-sized vectors: point at dot / coefficient-wise
// product functions.
418 EIGEN_STATIC_ASSERT(ProductIsValid || !(AreVectors && SameSizes),
419 INVALID_VECTOR_VECTOR_PRODUCT__IF_YOU_WANTED_A_DOT_OR_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTIONS)
// Invalid product of two same-sized non-vector operands: point at the
// coefficient-wise product function.
420 EIGEN_STATIC_ASSERT(ProductIsValid || !(SameSizes && !AreVectors),
421 INVALID_MATRIX_PRODUCT__IF_YOU_WANTED_A_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTION)
// Any other invalid combination: generic message.
422 EIGEN_STATIC_ASSERT(ProductIsValid || SameSizes, INVALID_MATRIX_PRODUCT)
// Only when EIGEN_DEBUG_PRODUCT is defined: call product_type's debug().
423#ifdef EIGEN_DEBUG_PRODUCT
424 internal::product_type<Derived,OtherDerived>::debug();
// Member template that validates the operand dimensions at compile time with
// the same three static assertions as the regular product operator.
// NOTE(review): the return type, declarator line, `enum {` opener, braces and
// the return statement are not visible in this listing; presumably this is
// MatrixBase<Derived>::lazyProduct returning a LazyProduct expression --
// confirm.
441template<
typename Derived>
442template<
typename OtherDerived>
443EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
// ProductIsValid: the inner dimensions agree, or at least one is Dynamic.
448 ProductIsValid = Derived::ColsAtCompileTime==
Dynamic
449 || OtherDerived::RowsAtCompileTime==
Dynamic
450 || int(Derived::ColsAtCompileTime)==int(OtherDerived::RowsAtCompileTime),
// AreVectors / SameSizes only serve to pick the most helpful error message.
451 AreVectors = Derived::IsVectorAtCompileTime && OtherDerived::IsVectorAtCompileTime,
452 SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived,OtherDerived)
// Invalid product of two same-sized vectors: point at dot / coefficient-wise
// product functions.
457 EIGEN_STATIC_ASSERT(ProductIsValid || !(AreVectors && SameSizes),
458 INVALID_VECTOR_VECTOR_PRODUCT__IF_YOU_WANTED_A_DOT_OR_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTIONS)
// Invalid product of two same-sized non-vector operands: point at the
// coefficient-wise product function.
459 EIGEN_STATIC_ASSERT(ProductIsValid || !(SameSizes && !AreVectors),
460 INVALID_MATRIX_PRODUCT__IF_YOU_WANTED_A_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTION)
// Any other invalid combination: generic message.
461 EIGEN_STATIC_ASSERT(ProductIsValid || SameSizes, INVALID_MATRIX_PRODUCT)
internal::traits< Homogeneous< MatrixType, Direction_ > >::Scalar Scalar
Definition: DenseBase.h:61
Derived & derived()
Definition: EigenBase.h:48
Base class for all dense matrices, vectors, and expressions.
Definition: MatrixBase.h:52
const Product< Derived, OtherDerived, LazyProduct > lazyProduct(const MatrixBase< OtherDerived > &other) const
Definition: GeneralProduct.h:445
const Product< Derived, OtherDerived > operator*(const MatrixBase< OtherDerived > &other) const
Definition: GeneralProduct.h:402
Expression of the product of two arbitrary matrices or vectors.
Definition: Product.h:77
@ ColMajor
Definition: Constants.h:321
@ RowMajor
Definition: Constants.h:323
@ OnTheLeft
Definition: Constants.h:334
@ OnTheRight
Definition: Constants.h:336
Namespace containing all symbols from the Eigen library.
Definition: B01_Experimental.dox:1
EIGEN_DEFAULT_DENSE_INDEX_TYPE Index
The Index type as used for the API.
Definition: Meta.h:59
const int Dynamic
Definition: Constants.h:24