162struct product_type_selector<Small, Small, Large> {
163 enum { ret = GemmProduct };
166struct product_type_selector<Large, Small, Large> {
167 enum { ret = GemmProduct };
170struct product_type_selector<Small, Large, Large> {
171 enum { ret = GemmProduct };
174struct product_type_selector<Large, Large, Large> {
175 enum { ret = GemmProduct };
178struct product_type_selector<Large, Small, Small> {
179 enum { ret = CoeffBasedProductMode };
182struct product_type_selector<Small, Large, Small> {
183 enum { ret = CoeffBasedProductMode };
186struct product_type_selector<Large, Large, Small> {
187 enum { ret = GemmProduct };
220template <
int S
ide,
int StorageOrder,
bool BlasCompatible>
221struct gemv_dense_selector;
227template <
typename Scalar,
int Size,
int MaxSize,
bool Cond>
228struct gemv_static_vector_if;
230template <
typename Scalar,
int Size,
int MaxSize>
231struct gemv_static_vector_if<Scalar, Size, MaxSize, false> {
232 EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC
constexpr Scalar* data() {
233 eigen_internal_assert(
false &&
"should never be called");
238template <
typename Scalar,
int Size>
239struct gemv_static_vector_if<Scalar, Size,
Dynamic, true> {
240 EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC
constexpr Scalar* data() {
return 0; }
243template <
typename Scalar,
int Size,
int MaxSize>
244struct gemv_static_vector_if<Scalar, Size, MaxSize, true> {
245#if EIGEN_MAX_STATIC_ALIGN_BYTES != 0
246 internal::plain_array<Scalar, internal::min_size_prefer_fixed(Size, MaxSize), 0, AlignedMax> m_data;
247 EIGEN_STRONG_INLINE
constexpr Scalar* data() {
return m_data.array; }
251 internal::plain_array<Scalar, internal::min_size_prefer_fixed(Size, MaxSize) + EIGEN_MAX_ALIGN_BYTES, 0> m_data;
252 EIGEN_STRONG_INLINE
constexpr Scalar* data() {
253 return reinterpret_cast<Scalar*
>((std::uintptr_t(m_data.array) & ~(std::size_t(EIGEN_MAX_ALIGN_BYTES - 1))) +
254 EIGEN_MAX_ALIGN_BYTES);
260template <
int StorageOrder,
bool BlasCompatible>
261struct gemv_dense_selector<
OnTheLeft, StorageOrder, BlasCompatible> {
262 template <
typename Lhs,
typename Rhs,
typename Dest>
263 static void run(
const Lhs& lhs,
const Rhs& rhs, Dest& dest,
const typename Dest::Scalar& alpha) {
264 Transpose<Dest> destT(dest);
266 gemv_dense_selector<OnTheRight, OtherStorageOrder, BlasCompatible>::run(rhs.transpose(), lhs.transpose(), destT,
273 template <
typename Lhs,
typename Rhs,
typename Dest>
274 static inline void run(
const Lhs& lhs,
const Rhs& rhs, Dest& dest,
const typename Dest::Scalar& alpha) {
275 typedef typename Lhs::Scalar LhsScalar;
276 typedef typename Rhs::Scalar RhsScalar;
277 typedef typename Dest::Scalar ResScalar;
279 typedef internal::blas_traits<Lhs> LhsBlasTraits;
280 typedef typename LhsBlasTraits::DirectLinearAccessType ActualLhsType;
281 typedef internal::blas_traits<Rhs> RhsBlasTraits;
282 typedef typename RhsBlasTraits::DirectLinearAccessType ActualRhsType;
284 typedef Map<Matrix<ResScalar, Dynamic, 1>, plain_enum_min(AlignedMax, internal::packet_traits<ResScalar>::size)>
287 ActualLhsType actualLhs = LhsBlasTraits::extract(lhs);
288 ActualRhsType actualRhs = RhsBlasTraits::extract(rhs);
290 ResScalar actualAlpha = combine_scalar_factors(alpha, lhs, rhs);
293 typedef std::conditional_t<Dest::IsVectorAtCompileTime, Dest, typename Dest::ColXpr> ActualDest;
298 EvalToDestAtCompileTime = (ActualDest::InnerStrideAtCompileTime == 1),
299 ComplexByReal = (NumTraits<LhsScalar>::IsComplex) && (!NumTraits<RhsScalar>::IsComplex),
300 MightCannotUseDest = ((!EvalToDestAtCompileTime) || ComplexByReal) && (ActualDest::MaxSizeAtCompileTime != 0)
303 typedef const_blas_data_mapper<LhsScalar, Index, ColMajor> LhsMapper;
304 typedef const_blas_data_mapper<RhsScalar, Index, RowMajor> RhsMapper;
305 RhsScalar compatibleAlpha = get_factor<ResScalar, RhsScalar>::run(actualAlpha);
307 if (!MightCannotUseDest) {
310 general_matrix_vector_product<
Index, LhsScalar, LhsMapper,
ColMajor, LhsBlasTraits::NeedToConjugate, RhsScalar,
311 RhsMapper, RhsBlasTraits::NeedToConjugate>::run(actualLhs.rows(), actualLhs.cols(),
312 LhsMapper(actualLhs.data(),
313 actualLhs.outerStride()),
314 RhsMapper(actualRhs.data(),
315 actualRhs.innerStride()),
316 dest.data(), 1, compatibleAlpha);
318 gemv_static_vector_if<ResScalar, ActualDest::SizeAtCompileTime, ActualDest::MaxSizeAtCompileTime,
322 const bool alphaIsCompatible = (!ComplexByReal) || (numext::is_exactly_zero(numext::imag(actualAlpha)));
323 const bool evalToDest = EvalToDestAtCompileTime && alphaIsCompatible;
325 ei_declare_aligned_stack_constructed_variable(ResScalar, actualDestPtr, dest.size(),
326 evalToDest ? dest.data() : static_dest.data());
329#ifdef EIGEN_DENSE_STORAGE_CTOR_PLUGIN
330 constexpr int Size = Dest::SizeAtCompileTime;
331 Index size = dest.size();
332 EIGEN_DENSE_STORAGE_CTOR_PLUGIN
334 if (!alphaIsCompatible) {
335 MappedDest(actualDestPtr, dest.size()).setZero();
336 compatibleAlpha = RhsScalar(1);
338 MappedDest(actualDestPtr, dest.size()) = dest;
341 general_matrix_vector_product<
Index, LhsScalar, LhsMapper,
ColMajor, LhsBlasTraits::NeedToConjugate, RhsScalar,
342 RhsMapper, RhsBlasTraits::NeedToConjugate>::run(actualLhs.rows(), actualLhs.cols(),
343 LhsMapper(actualLhs.data(),
344 actualLhs.outerStride()),
345 RhsMapper(actualRhs.data(),
346 actualRhs.innerStride()),
347 actualDestPtr, 1, compatibleAlpha);
350 if (!alphaIsCompatible)
351 dest.matrix() += actualAlpha * MappedDest(actualDestPtr, dest.size());
353 dest = MappedDest(actualDestPtr, dest.size());
361 template <
typename Lhs,
typename Rhs,
typename Dest>
362 static void run(
const Lhs& lhs,
const Rhs& rhs, Dest& dest,
const typename Dest::Scalar& alpha) {
363 typedef typename Lhs::Scalar LhsScalar;
364 typedef typename Rhs::Scalar RhsScalar;
365 typedef typename Dest::Scalar ResScalar;
367 typedef internal::blas_traits<Lhs> LhsBlasTraits;
368 typedef typename LhsBlasTraits::DirectLinearAccessType ActualLhsType;
369 typedef internal::blas_traits<Rhs> RhsBlasTraits;
370 typedef typename RhsBlasTraits::DirectLinearAccessType ActualRhsType;
371 typedef internal::remove_all_t<ActualRhsType> ActualRhsTypeCleaned;
373 std::add_const_t<ActualLhsType> actualLhs = LhsBlasTraits::extract(lhs);
374 std::add_const_t<ActualRhsType> actualRhs = RhsBlasTraits::extract(rhs);
376 ResScalar actualAlpha = combine_scalar_factors(alpha, lhs, rhs);
382 ActualRhsTypeCleaned::InnerStrideAtCompileTime == 1 || ActualRhsTypeCleaned::MaxSizeAtCompileTime == 0
385 gemv_static_vector_if<RhsScalar, ActualRhsTypeCleaned::SizeAtCompileTime,
386 ActualRhsTypeCleaned::MaxSizeAtCompileTime, !DirectlyUseRhs>
389 ei_declare_aligned_stack_constructed_variable(
390 RhsScalar, actualRhsPtr, actualRhs.size(),
391 DirectlyUseRhs ?
const_cast<RhsScalar*
>(actualRhs.data()) : static_rhs.data());
393 if (!DirectlyUseRhs) {
394#ifdef EIGEN_DENSE_STORAGE_CTOR_PLUGIN
395 constexpr int Size = ActualRhsTypeCleaned::SizeAtCompileTime;
396 Index size = actualRhs.size();
397 EIGEN_DENSE_STORAGE_CTOR_PLUGIN
399 Map<typename ActualRhsTypeCleaned::PlainObject>(actualRhsPtr, actualRhs.size()) = actualRhs;
402 typedef const_blas_data_mapper<LhsScalar, Index, RowMajor> LhsMapper;
403 typedef const_blas_data_mapper<RhsScalar, Index, ColMajor> RhsMapper;
404 general_matrix_vector_product<
Index, LhsScalar, LhsMapper,
RowMajor, LhsBlasTraits::NeedToConjugate, RhsScalar,
405 RhsMapper, RhsBlasTraits::NeedToConjugate>::
406 run(actualLhs.rows(), actualLhs.cols(), LhsMapper(actualLhs.data(), actualLhs.outerStride()),
407 RhsMapper(actualRhsPtr, 1), dest.data(),
408 dest.col(0).innerStride(),
416 template <
typename Lhs,
typename Rhs,
typename Dest>
417 static void run(
const Lhs& lhs,
const Rhs& rhs, Dest& dest,
const typename Dest::Scalar& alpha) {
418 EIGEN_STATIC_ASSERT((!nested_eval<Lhs, 1>::Evaluate),
419 EIGEN_INTERNAL_COMPILATION_ERROR_OR_YOU_MADE_A_PROGRAMMING_MISTAKE);
422 typename nested_eval<Rhs, 1>::type actual_rhs(rhs);
423 const Index size = rhs.rows();
424 for (Index k = 0; k < size; ++k) dest += (alpha * actual_rhs.coeff(k)) * lhs.col(k);
430 template <
typename Lhs,
typename Rhs,
typename Dest>
431 static void run(
const Lhs& lhs,
const Rhs& rhs, Dest& dest,
const typename Dest::Scalar& alpha) {
432 EIGEN_STATIC_ASSERT((!nested_eval<Lhs, 1>::Evaluate),
433 EIGEN_INTERNAL_COMPILATION_ERROR_OR_YOU_MADE_A_PROGRAMMING_MISTAKE);
434 typename nested_eval<Rhs, Lhs::RowsAtCompileTime>::type actual_rhs(rhs);
435 const Index rows = dest.rows();
436 for (Index i = 0; i < rows; ++i)
437 dest.coeffRef(i) += alpha * (lhs.row(i).cwiseProduct(actual_rhs.transpose())).sum();
453template <
typename Derived>
454template <
typename OtherDerived>
456 const MatrixBase<OtherDerived>& other)
const {
462 ProductIsValid = Derived::ColsAtCompileTime ==
Dynamic || OtherDerived::RowsAtCompileTime ==
Dynamic ||
463 int(Derived::ColsAtCompileTime) == int(OtherDerived::RowsAtCompileTime),
464 AreVectors = Derived::IsVectorAtCompileTime && OtherDerived::IsVectorAtCompileTime,
465 SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived, OtherDerived)
471 ProductIsValid || !(AreVectors && SameSizes),
472 INVALID_VECTOR_VECTOR_PRODUCT__IF_YOU_WANTED_A_DOT_OR_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTIONS)
473 EIGEN_STATIC_ASSERT(ProductIsValid || !(SameSizes && !AreVectors),
474 INVALID_MATRIX_PRODUCT__IF_YOU_WANTED_A_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTION)
475 EIGEN_STATIC_ASSERT(ProductIsValid || SameSizes, INVALID_MATRIX_PRODUCT)
476#ifdef EIGEN_DEBUG_PRODUCT
477 internal::product_type<Derived, OtherDerived>::debug();
494template <
typename Derived>
495template <
typename OtherDerived>
499 ProductIsValid = Derived::ColsAtCompileTime ==
Dynamic || OtherDerived::RowsAtCompileTime ==
Dynamic ||
500 int(Derived::ColsAtCompileTime) == int(OtherDerived::RowsAtCompileTime),
501 AreVectors = Derived::IsVectorAtCompileTime && OtherDerived::IsVectorAtCompileTime,
502 SameSizes = EIGEN_PREDICATE_SAME_MATRIX_SIZE(Derived, OtherDerived)
508 ProductIsValid || !(AreVectors && SameSizes),
509 INVALID_VECTOR_VECTOR_PRODUCT__IF_YOU_WANTED_A_DOT_OR_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTIONS)
510 EIGEN_STATIC_ASSERT(ProductIsValid || !(SameSizes && !AreVectors),
511 INVALID_MATRIX_PRODUCT__IF_YOU_WANTED_A_COEFF_WISE_PRODUCT_YOU_MUST_USE_THE_EXPLICIT_FUNCTION)
512 EIGEN_STATIC_ASSERT(ProductIsValid || SameSizes, INVALID_MATRIX_PRODUCT)